From 0d8a3f13e39c9e0be87c8459db9582c7c336617f Mon Sep 17 00:00:00 2001
From: Nikita Taranov <nikita.taranov@clickhouse.com>
Date: Fri, 26 Jul 2024 21:49:41 +0100
Subject: [PATCH 01/52] impl

---
 src/Processors/Sources/ShellCommandSource.cpp    | 16 ++++++++++++----
 .../test_executable_dictionary/test.py           |  1 +
 2 files changed, 13 insertions(+), 4 deletions(-)
diff --git a/src/Processors/Sources/ShellCommandSource.cpp b/src/Processors/Sources/ShellCommandSource.cpp
index 55eaf67eb3b..1659287c227 100644
--- a/src/Processors/Sources/ShellCommandSource.cpp
+++ b/src/Processors/Sources/ShellCommandSource.cpp
@@ -8,13 +8,15 @@
 #include <IO/WriteHelpers.h>
 #include <IO/ReadHelpers.h>
 
-#include <QueryPipeline/Pipe.h>
-#include <Processors/ISimpleTransform.h>
-#include <Processors/Formats/IOutputFormat.h>
-#include <Processors/Executors/CompletedPipelineExecutor.h>
 #include <Interpreters/Context.h>
+#include <Processors/Executors/CompletedPipelineExecutor.h>
+#include <Processors/Formats/IOutputFormat.h>
+#include <Processors/ISimpleTransform.h>
+#include <QueryPipeline/Pipe.h>
+
 #include <boost/circular_buffer.hpp>
 
+#include <ranges>
 
 namespace DB
 {
@@ -137,9 +139,15 @@ public:
 
         while (!bytes_read)
         {
+            LOG_TRACE(
+                getLogger("TimeoutReadBufferFromFileDescriptor"),
+                "Starting polling on descriptors ({}) with timeout {} ms",
+                fmt::join(std::span(pfds, pfds + num_pfds) | std::views::transform([](const auto & pollfd) { return pollfd.fd; }), ", "),
+                timeout_milliseconds);
             pfds[0].revents = 0;
             pfds[1].revents = 0;
             size_t num_events = pollWithTimeout(pfds, num_pfds, timeout_milliseconds);
+            LOG_TRACE(getLogger("TimeoutReadBufferFromFileDescriptor"), "Poll returned with num_events={}", num_events);
             if (0 == num_events)
                 throw Exception(ErrorCodes::TIMEOUT_EXCEEDED, "Pipe read timeout exceeded {} milliseconds", timeout_milliseconds);
 
diff --git a/tests/integration/test_executable_dictionary/test.py b/tests/integration/test_executable_dictionary/test.py
index 22f3442bb95..a1de429a235 100644
--- a/tests/integration/test_executable_dictionary/test.py
+++ b/tests/integration/test_executable_dictionary/test.py
@@ -245,6 +245,7 @@ def test_executable_input_slow_python(started_cluster):
     )
 
 
+@pytest.mark.repeat(50)
 def test_executable_implicit_input_slow_python(started_cluster):
     skip_test_msan(node)
     assert node.query_and_get_error(

From 6317979825794882905bc02b3a18dd82cfd8ec1c Mon Sep 17 00:00:00 2001
From: Nikita Taranov <nikita.taranov@clickhouse.com>
Date: Mon, 29 Jul 2024 20:53:11 +0100
Subject: [PATCH 02/52] add one more

---
 tests/integration/test_executable_table_function/test.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/tests/integration/test_executable_table_function/test.py b/tests/integration/test_executable_table_function/test.py
index 801a3c7c14a..a79616fc008 100644
--- a/tests/integration/test_executable_table_function/test.py
+++ b/tests/integration/test_executable_table_function/test.py
@@ -139,6 +139,7 @@ def test_executable_function_input_signalled_python(started_cluster):
     assert node.query(query.format(source="(SELECT id FROM test_data_table)")) == ""
 
 
+@pytest.mark.repeat(50)
 def test_executable_function_input_slow_python(started_cluster):
     skip_test_msan(node)
 

From 51b39a6c745d61cb2e6feb39659ddb3cac57ad03 Mon Sep 17 00:00:00 2001
From: Nikita Taranov <nikita.taranov@clickhouse.com>
Date: Thu, 1 Aug 2024 18:24:45 +0100
Subject: [PATCH 03/52] some more

---
 tests/integration/test_executable_dictionary/test.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/tests/integration/test_executable_dictionary/test.py b/tests/integration/test_executable_dictionary/test.py
index a1de429a235..2a6af75e751 100644
--- a/tests/integration/test_executable_dictionary/test.py
+++ b/tests/integration/test_executable_dictionary/test.py
@@ -235,6 +235,7 @@ def test_executable_implicit_input_signalled_python(started_cluster):
     )
 
 
+@pytest.mark.repeat(50)
 def test_executable_input_slow_python(started_cluster):
     skip_test_msan(node)
     assert node.query_and_get_error(

From 51918dc080c9fa4b128a151cfbd0d28b294c56d3 Mon Sep 17 00:00:00 2001
From: Nikita Taranov <nikita.taranov@clickhouse.com>
Date: Sat, 3 Aug 2024 00:24:00 +0100
Subject: [PATCH 04/52] impl

---
 src/Common/ShellCommand.cpp                   |  9 ++++-
 src/Processors/Sources/ShellCommandSource.cpp | 39 +++++++++++++------
 2 files changed, 35 insertions(+), 13 deletions(-)

diff --git a/src/Common/ShellCommand.cpp b/src/Common/ShellCommand.cpp
index 98a21b43d76..79b0d667863 100644
--- a/src/Common/ShellCommand.cpp
+++ b/src/Common/ShellCommand.cpp
@@ -237,7 +237,14 @@ std::unique_ptr<ShellCommand> ShellCommand::executeImpl(
         res->write_fds.emplace(fd, fds.fds_rw[1]);
     }
 
-    LOG_TRACE(getLogger(), "Started shell command '{}' with pid {}", filename, pid);
+    LOG_TRACE(
+        getLogger(),
+        "Started shell command '{}' with pid {} and file descriptors: read {}, write {}",
+        filename,
+        pid,
+        res->out.getFD(),
+        res->err.getFD());
+
     return res;
 }
 
diff --git a/src/Processors/Sources/ShellCommandSource.cpp b/src/Processors/Sources/ShellCommandSource.cpp
index 1659287c227..923bdfad8f8 100644
--- a/src/Processors/Sources/ShellCommandSource.cpp
+++ b/src/Processors/Sources/ShellCommandSource.cpp
@@ -75,6 +75,15 @@ static int pollWithTimeout(pollfd * pfds, size_t num, size_t timeout_millisecond
     while (true)
     {
         Stopwatch watch;
+
+#if defined(DEBUG_OR_SANITIZER_BUILD)
+        auto describe_fd = [](const auto & pollfd) { return fmt::format("(fd={}, flags={})", pollfd.fd, fcntl(pollfd.fd, F_GETFL)); };
+        LOG_TRACE(
+            getLogger("TimeoutReadBufferFromFileDescriptor"),
+            "Polling descriptors: {}",
+            fmt::join(std::span(pfds, pfds + num) | std::views::transform(describe_fd), ", "));
+#endif
+
         res = poll(pfds, static_cast<nfds_t>(num), static_cast<int>(timeout_milliseconds));
 
         if (res < 0)
@@ -84,7 +93,16 @@ static int pollWithTimeout(pollfd * pfds, size_t num, size_t timeout_millisecond
 
             const auto elapsed = watch.elapsedMilliseconds();
             if (timeout_milliseconds <= elapsed)
+            {
+#if defined(DEBUG_OR_SANITIZER_BUILD)
+                LOG_TRACE(
+                    getLogger("TimeoutReadBufferFromFileDescriptor"),
+                    "Timeout exceeded: elapsed={}, timeout={}",
+                    elapsed,
+                    timeout_milliseconds);
+#endif
                 break;
+            }
             timeout_milliseconds -= elapsed;
         }
         else
@@ -93,6 +111,15 @@ static int pollWithTimeout(pollfd * pfds, size_t num, size_t timeout_millisecond
         }
     }
 
+#if defined(DEBUG_OR_SANITIZER_BUILD)
+    auto describe_fd = [](const auto & pollfd) { return fmt::format("(fd={}, flags={})", pollfd.fd, fcntl(pollfd.fd, F_GETFL)); };
+    LOG_TRACE(
+        getLogger("TimeoutReadBufferFromFileDescriptor"),
+        "Poll for descriptors: {} returned {}",
+        fmt::join(std::span(pfds, pfds + num) | std::views::transform(describe_fd), ", "),
+        res);
+#endif
+
     return res;
 }
 
@@ -139,15 +166,9 @@ public:
 
         while (!bytes_read)
         {
-            LOG_TRACE(
-                getLogger("TimeoutReadBufferFromFileDescriptor"),
-                "Starting polling on descriptors ({}) with timeout {} ms",
-                fmt::join(std::span(pfds, pfds + num_pfds) | std::views::transform([](const auto & pollfd) { return pollfd.fd; }), ", "),
-                timeout_milliseconds);
             pfds[0].revents = 0;
             pfds[1].revents = 0;
             size_t num_events = pollWithTimeout(pfds, num_pfds, timeout_milliseconds);
-            LOG_TRACE(getLogger("TimeoutReadBufferFromFileDescriptor"), "Poll returned with num_events={}", num_events);
             if (0 == num_events)
                 throw Exception(ErrorCodes::TIMEOUT_EXCEEDED, "Pipe read timeout exceeded {} milliseconds", timeout_milliseconds);
 
@@ -208,12 +229,6 @@ public:
         return true;
     }
 
-    void reset() const
-    {
-        makeFdBlocking(stdout_fd);
-        makeFdBlocking(stderr_fd);
-    }
-
     ~TimeoutReadBufferFromFileDescriptor() override
     {
         tryMakeFdBlocking(stdout_fd);

From cb6baefa948ef1270ce9454f72075ac10bf6e729 Mon Sep 17 00:00:00 2001
From: Nikita Taranov <nikita.taranov@clickhouse.com>
Date: Mon, 5 Aug 2024 21:49:36 +0100
Subject: [PATCH 05/52] better

---
 src/Common/ShellCommand.cpp                          |  2 +-
 src/Processors/Sources/ShellCommandSource.cpp        | 12 +++---------
 tests/integration/test_executable_dictionary/test.py |  2 --
 .../test_executable_table_function/test.py           |  1 -
 4 files changed, 4 insertions(+), 13 deletions(-)

diff --git a/src/Common/ShellCommand.cpp b/src/Common/ShellCommand.cpp
index 79b0d667863..0d41669816c 100644
--- a/src/Common/ShellCommand.cpp
+++ b/src/Common/ShellCommand.cpp
@@ -239,7 +239,7 @@ std::unique_ptr<ShellCommand> ShellCommand::executeImpl(
 
     LOG_TRACE(
         getLogger(),
-        "Started shell command '{}' with pid {} and file descriptors: read {}, write {}",
+        "Started shell command '{}' with pid {} and file descriptors: out {}, err {}",
         filename,
         pid,
         res->out.getFD(),
diff --git a/src/Processors/Sources/ShellCommandSource.cpp b/src/Processors/Sources/ShellCommandSource.cpp
index 923bdfad8f8..23359367a9b 100644
--- a/src/Processors/Sources/ShellCommandSource.cpp
+++ b/src/Processors/Sources/ShellCommandSource.cpp
@@ -76,13 +76,11 @@ static int pollWithTimeout(pollfd * pfds, size_t num, size_t timeout_millisecond
     {
         Stopwatch watch;
 
-#if defined(DEBUG_OR_SANITIZER_BUILD)
         auto describe_fd = [](const auto & pollfd) { return fmt::format("(fd={}, flags={})", pollfd.fd, fcntl(pollfd.fd, F_GETFL)); };
-        LOG_TRACE(
+        LOG_TEST(
             getLogger("TimeoutReadBufferFromFileDescriptor"),
             "Polling descriptors: {}",
             fmt::join(std::span(pfds, pfds + num) | std::views::transform(describe_fd), ", "));
-#endif
 
         res = poll(pfds, static_cast<nfds_t>(num), static_cast<int>(timeout_milliseconds));
 
@@ -94,13 +92,11 @@ static int pollWithTimeout(pollfd * pfds, size_t num, size_t timeout_millisecond
             const auto elapsed = watch.elapsedMilliseconds();
             if (timeout_milliseconds <= elapsed)
             {
-#if defined(DEBUG_OR_SANITIZER_BUILD)
-                LOG_TRACE(
+                LOG_TEST(
                     getLogger("TimeoutReadBufferFromFileDescriptor"),
                     "Timeout exceeded: elapsed={}, timeout={}",
                     elapsed,
                     timeout_milliseconds);
-#endif
                 break;
             }
             timeout_milliseconds -= elapsed;
@@ -111,14 +107,12 @@ static int pollWithTimeout(pollfd * pfds, size_t num, size_t timeout_millisecond
         }
     }
 
-#if defined(DEBUG_OR_SANITIZER_BUILD)
     auto describe_fd = [](const auto & pollfd) { return fmt::format("(fd={}, flags={})", pollfd.fd, fcntl(pollfd.fd, F_GETFL)); };
-    LOG_TRACE(
+    LOG_TEST(
         getLogger("TimeoutReadBufferFromFileDescriptor"),
         "Poll for descriptors: {} returned {}",
         fmt::join(std::span(pfds, pfds + num) | std::views::transform(describe_fd), ", "),
         res);
-#endif
 
     return res;
 }
diff --git a/tests/integration/test_executable_dictionary/test.py b/tests/integration/test_executable_dictionary/test.py
index 2a6af75e751..22f3442bb95 100644
--- a/tests/integration/test_executable_dictionary/test.py
+++ b/tests/integration/test_executable_dictionary/test.py
@@ -235,7 +235,6 @@ def test_executable_implicit_input_signalled_python(started_cluster):
     )
 
 
-@pytest.mark.repeat(50)
 def test_executable_input_slow_python(started_cluster):
     skip_test_msan(node)
     assert node.query_and_get_error(
@@ -246,7 +245,6 @@ def test_executable_input_slow_python(started_cluster):
     )
 
 
-@pytest.mark.repeat(50)
 def test_executable_implicit_input_slow_python(started_cluster):
     skip_test_msan(node)
     assert node.query_and_get_error(
diff --git a/tests/integration/test_executable_table_function/test.py b/tests/integration/test_executable_table_function/test.py
index a79616fc008..801a3c7c14a 100644
--- a/tests/integration/test_executable_table_function/test.py
+++ b/tests/integration/test_executable_table_function/test.py
@@ -139,7 +139,6 @@ def test_executable_function_input_signalled_python(started_cluster):
     assert node.query(query.format(source="(SELECT id FROM test_data_table)")) == ""
 
 
-@pytest.mark.repeat(50)
 def test_executable_function_input_slow_python(started_cluster):
     skip_test_msan(node)
 

From 815fdc43ac333a75adff646fef073ea591494d13 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?J=C3=A1nos=20Benjamin=20Antal?=
 <benjamin.antal@clickhouse.com>
Date: Tue, 6 Aug 2024 14:36:02 +0000
Subject: [PATCH 06/52] Revert "Merge pull request #67800 from
 ClickHouse/revert-66510"

This reverts commit 45c4a71ccb62bac6728d0e583fd04c0fc4f45a6f, reversing
changes made to bb71c1eea8e6019a5a21b6add08c2244764ddea5.
---
 src/Storages/MergeTree/MergeTreeData.cpp      |  2 +-
 src/Storages/VirtualColumnUtils.cpp           | 21 ++++++++++++-------
 src/Storages/VirtualColumnUtils.h             | 10 ++++++++-
 ..._with_non_deterministic_function.reference |  2 ++
 ..._count_with_non_deterministic_function.sql |  4 ++++
 5 files changed, 30 insertions(+), 9 deletions(-)
 create mode 100644 tests/queries/0_stateless/03203_count_with_non_deterministic_function.reference
 create mode 100644 tests/queries/0_stateless/03203_count_with_non_deterministic_function.sql

diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp
index 49888596fbb..ce27ad24e10 100644
--- a/src/Storages/MergeTree/MergeTreeData.cpp
+++ b/src/Storages/MergeTree/MergeTreeData.cpp
@@ -1146,7 +1146,7 @@ std::optional<UInt64> MergeTreeData::totalRowsByPartitionPredicateImpl(
     auto metadata_snapshot = getInMemoryMetadataPtr();
     auto virtual_columns_block = getBlockWithVirtualsForFilter(metadata_snapshot, {parts[0]});
 
-    auto filter_dag = VirtualColumnUtils::splitFilterDagForAllowedInputs(filter_actions_dag.getOutputs().at(0), nullptr);
+    auto filter_dag = VirtualColumnUtils::splitFilterDagForAllowedInputs(filter_actions_dag.getOutputs().at(0), nullptr, /*allow_non_deterministic_functions=*/ false);
     if (!filter_dag)
         return {};
 
diff --git a/src/Storages/VirtualColumnUtils.cpp b/src/Storages/VirtualColumnUtils.cpp
index ba1f4488005..90c2c7f93c1 100644
--- a/src/Storages/VirtualColumnUtils.cpp
+++ b/src/Storages/VirtualColumnUtils.cpp
@@ -275,7 +275,8 @@ bool isDeterministicInScopeOfQuery(const ActionsDAG::Node * node)
 static const ActionsDAG::Node * splitFilterNodeForAllowedInputs(
     const ActionsDAG::Node * node,
     const Block * allowed_inputs,
-    ActionsDAG::Nodes & additional_nodes)
+    ActionsDAG::Nodes & additional_nodes,
+    bool allow_non_deterministic_functions)
 {
     if (node->type == ActionsDAG::ActionType::FUNCTION)
     {
@@ -284,8 +285,14 @@ static const ActionsDAG::Node * splitFilterNodeForAllowedInputs(
             auto & node_copy = additional_nodes.emplace_back(*node);
             node_copy.children.clear();
             for (const auto * child : node->children)
-                if (const auto * child_copy = splitFilterNodeForAllowedInputs(child, allowed_inputs, additional_nodes))
+                if (const auto * child_copy = splitFilterNodeForAllowedInputs(child, allowed_inputs, additional_nodes, allow_non_deterministic_functions))
                     node_copy.children.push_back(child_copy);
+                /// Expression like (now_allowed AND allowed) is not allowed if allow_non_deterministic_functions = true. This is important for
+                /// trivial count optimization, otherwise we can get incorrect results. For example, if the query is
+                /// SELECT count() FROM table WHERE _partition_id = '0' AND rowNumberInBlock() = 1, we cannot apply
+                /// trivial count.
+                else if (!allow_non_deterministic_functions)
+                    return nullptr;
 
             if (node_copy.children.empty())
                 return nullptr;
@@ -311,7 +318,7 @@ static const ActionsDAG::Node * splitFilterNodeForAllowedInputs(
         {
             auto & node_copy = additional_nodes.emplace_back(*node);
             for (auto & child : node_copy.children)
-                if (child = splitFilterNodeForAllowedInputs(child, allowed_inputs, additional_nodes); !child)
+                if (child = splitFilterNodeForAllowedInputs(child, allowed_inputs, additional_nodes, allow_non_deterministic_functions); !child)
                     return nullptr;
 
             return &node_copy;
@@ -325,7 +332,7 @@ static const ActionsDAG::Node * splitFilterNodeForAllowedInputs(
                     auto index_hint_dag = index_hint->getActions().clone();
                     ActionsDAG::NodeRawConstPtrs atoms;
                     for (const auto & output : index_hint_dag.getOutputs())
-                        if (const auto * child_copy = splitFilterNodeForAllowedInputs(output, allowed_inputs, additional_nodes))
+                        if (const auto * child_copy = splitFilterNodeForAllowedInputs(output, allowed_inputs, additional_nodes, allow_non_deterministic_functions))
                             atoms.push_back(child_copy);
 
                     if (!atoms.empty())
@@ -359,13 +366,13 @@ static const ActionsDAG::Node * splitFilterNodeForAllowedInputs(
     return node;
 }
 
-std::optional<ActionsDAG> splitFilterDagForAllowedInputs(const ActionsDAG::Node * predicate, const Block * allowed_inputs)
+std::optional<ActionsDAG> splitFilterDagForAllowedInputs(const ActionsDAG::Node * predicate, const Block * allowed_inputs, bool allow_non_deterministic_functions)
 {
     if (!predicate)
         return {};
 
     ActionsDAG::Nodes additional_nodes;
-    const auto * res = splitFilterNodeForAllowedInputs(predicate, allowed_inputs, additional_nodes);
+    const auto * res = splitFilterNodeForAllowedInputs(predicate, allowed_inputs, additional_nodes, allow_non_deterministic_functions);
     if (!res)
         return {};
 
@@ -374,7 +381,7 @@ std::optional<ActionsDAG> splitFilterDagForAllowedInputs(const ActionsDAG::Node
 
 void filterBlockWithPredicate(const ActionsDAG::Node * predicate, Block & block, ContextPtr context)
 {
-    auto dag = splitFilterDagForAllowedInputs(predicate, &block);
+    auto dag = splitFilterDagForAllowedInputs(predicate, &block,  /*allow_non_deterministic_functions=*/ false);
     if (dag)
         filterBlockWithExpression(buildFilterExpression(std::move(*dag), context), block);
 }
diff --git a/src/Storages/VirtualColumnUtils.h b/src/Storages/VirtualColumnUtils.h
index d75dc70ae44..abf46dc23a4 100644
--- a/src/Storages/VirtualColumnUtils.h
+++ b/src/Storages/VirtualColumnUtils.h
@@ -41,7 +41,15 @@ void buildSetsForDAG(const ActionsDAG & dag, const ContextPtr & context);
 bool isDeterministicInScopeOfQuery(const ActionsDAG::Node * node);
 
 /// Extract a part of predicate that can be evaluated using only columns from input_names.
-std::optional<ActionsDAG> splitFilterDagForAllowedInputs(const ActionsDAG::Node * predicate, const Block * allowed_inputs);
+/// When allow_non_deterministic_functions is true then even if the predicate contains non-deterministic
+/// functions, we still allow to extract a part of the predicate, otherwise we return nullptr.
+/// allow_non_deterministic_functions must be false when we are going to use the result to filter parts in
+/// MergeTreeData::totalRowsByPartitionPredicateImp. For example, if the query is
+/// `SELECT count() FROM table  WHERE _partition_id = '0' AND rowNumberInBlock() = 1`
+/// The predicate will be `_partition_id = '0' AND rowNumberInBlock() = 1`, and `rowNumberInBlock()` is
+/// non-deterministic. If we still extract the part `_partition_id = '0'` for filtering parts, then trivial
+/// count optimization will be mistakenly applied to the query.
+std::optional<ActionsDAG> splitFilterDagForAllowedInputs(const ActionsDAG::Node * predicate, const Block * allowed_inputs, bool allow_non_deterministic_functions = true);
 
 /// Extract from the input stream a set of `name` column values
 template <typename T>
diff --git a/tests/queries/0_stateless/03203_count_with_non_deterministic_function.reference b/tests/queries/0_stateless/03203_count_with_non_deterministic_function.reference
new file mode 100644
index 00000000000..6ed281c757a
--- /dev/null
+++ b/tests/queries/0_stateless/03203_count_with_non_deterministic_function.reference
@@ -0,0 +1,2 @@
+1
+1
diff --git a/tests/queries/0_stateless/03203_count_with_non_deterministic_function.sql b/tests/queries/0_stateless/03203_count_with_non_deterministic_function.sql
new file mode 100644
index 00000000000..bb3269da597
--- /dev/null
+++ b/tests/queries/0_stateless/03203_count_with_non_deterministic_function.sql
@@ -0,0 +1,4 @@
+CREATE TABLE t (p UInt8, x UInt64) Engine = MergeTree PARTITION BY p ORDER BY x;
+INSERT INTO t SELECT 0, number FROM numbers(10) SETTINGS max_block_size = 100;
+SELECT count() FROM t WHERE p = 0 AND rowNumberInAllBlocks() = 1 SETTINGS allow_experimental_analyzer = 0;
+SELECT count() FROM t WHERE p = 0 AND rowNumberInAllBlocks() = 1 SETTINGS allow_experimental_analyzer = 1;

From 2074485083e8860aafc36ac7886a54a75e144468 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?J=C3=A1nos=20Benjamin=20Antal?=
 <benjamin.antal@clickhouse.com>
Date: Tue, 6 Aug 2024 14:25:02 +0000
Subject: [PATCH 07/52] Fix partial filtering in `filterBlockWithPredicate`

---
 src/Storages/MergeTree/MergeTreeData.cpp      |  3 +-
 src/Storages/VirtualColumnUtils.cpp           | 86 +++++++++----------
 src/Storages/VirtualColumnUtils.h             | 16 ++--
 ...03217_read_rows_in_system_tables.reference | 10 +++
 .../03217_read_rows_in_system_tables.sql      | 34 ++++++++
 5 files changed, 97 insertions(+), 52 deletions(-)
 create mode 100644 tests/queries/0_stateless/03217_read_rows_in_system_tables.reference
 create mode 100644 tests/queries/0_stateless/03217_read_rows_in_system_tables.sql

diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp
index ce27ad24e10..b24d7968b61 100644
--- a/src/Storages/MergeTree/MergeTreeData.cpp
+++ b/src/Storages/MergeTree/MergeTreeData.cpp
@@ -6914,7 +6914,8 @@ Block MergeTreeData::getMinMaxCountProjectionBlock(
         const auto * predicate = filter_dag->getOutputs().at(0);
 
         // Generate valid expressions for filtering
-        VirtualColumnUtils::filterBlockWithPredicate(predicate, virtual_columns_block, query_context);
+        VirtualColumnUtils::filterBlockWithPredicate(
+            predicate, virtual_columns_block, query_context, /*allow_filtering_with_partial_predicate =*/true);
 
         rows = virtual_columns_block.rows();
         part_name_column = virtual_columns_block.getByName("_part").column;
diff --git a/src/Storages/VirtualColumnUtils.cpp b/src/Storages/VirtualColumnUtils.cpp
index 90c2c7f93c1..b40378250bb 100644
--- a/src/Storages/VirtualColumnUtils.cpp
+++ b/src/Storages/VirtualColumnUtils.cpp
@@ -1,51 +1,46 @@
-#include <algorithm>
+#include <Storages/VirtualColumnUtils.h>
+
 #include <memory>
 #include <stack>
+#include <Columns/ColumnConst.h>
+#include <Columns/ColumnSet.h>
+#include <Columns/ColumnsCommon.h>
+#include <Columns/ColumnsNumber.h>
+#include <Columns/FilterDescription.h>
 #include <Core/NamesAndTypes.h>
 #include <Core/TypeId.h>
-
+#include <DataTypes/DataTypeDateTime.h>
+#include <DataTypes/DataTypeLowCardinality.h>
+#include <DataTypes/DataTypeString.h>
+#include <DataTypes/DataTypesNumber.h>
+#include <Functions/FunctionHelpers.h>
+#include <Functions/FunctionsLogical.h>
+#include <Functions/IFunction.h>
+#include <Functions/IFunctionAdaptors.h>
+#include <Functions/indexHint.h>
+#include <IO/WriteHelpers.h>
+#include <Interpreters/ActionsDAG.h>
+#include <Interpreters/ActionsVisitor.h>
 #include <Interpreters/Context.h>
-#include <Interpreters/TreeRewriter.h>
-#include <Interpreters/ExpressionAnalyzer.h>
 #include <Interpreters/ExpressionActions.h>
+#include <Interpreters/ExpressionAnalyzer.h>
 #include <Interpreters/IdentifierSemantic.h>
+#include <Interpreters/TreeRewriter.h>
 #include <Interpreters/misc.h>
-
-#include <Parsers/ASTIdentifier.h>
 #include <Parsers/ASTExpressionList.h>
-#include <Parsers/ASTLiteral.h>
 #include <Parsers/ASTFunction.h>
+#include <Parsers/ASTIdentifier.h>
+#include <Parsers/ASTLiteral.h>
 #include <Parsers/ASTSelectQuery.h>
 #include <Parsers/ASTSubquery.h>
-
-#include <Columns/ColumnConst.h>
-#include <Columns/ColumnsNumber.h>
-#include <Columns/ColumnsCommon.h>
-#include <Columns/FilterDescription.h>
-
-#include <DataTypes/DataTypesNumber.h>
-#include <DataTypes/DataTypeString.h>
-#include <DataTypes/DataTypeLowCardinality.h>
-#include <DataTypes/DataTypeDateTime.h>
-
-#include <Processors/QueryPlan/QueryPlan.h>
+#include <Parsers/makeASTForLogicalFunction.h>
+#include <Processors/Executors/CompletedPipelineExecutor.h>
 #include <Processors/QueryPlan/BuildQueryPipelineSettings.h>
 #include <Processors/QueryPlan/Optimizations/QueryPlanOptimizationSettings.h>
+#include <Processors/QueryPlan/QueryPlan.h>
 #include <Processors/Sinks/EmptySink.h>
-#include <Processors/Executors/CompletedPipelineExecutor.h>
 #include <QueryPipeline/QueryPipelineBuilder.h>
-
-#include <Storages/VirtualColumnUtils.h>
-#include <IO/WriteHelpers.h>
 #include <Common/typeid_cast.h>
-#include "Functions/FunctionsLogical.h"
-#include "Functions/IFunction.h"
-#include "Functions/IFunctionAdaptors.h"
-#include "Functions/indexHint.h"
-#include <Parsers/makeASTForLogicalFunction.h>
-#include <Columns/ColumnSet.h>
-#include <Functions/FunctionHelpers.h>
-#include <Interpreters/ActionsVisitor.h>
 
 
 namespace DB
@@ -273,10 +268,7 @@ bool isDeterministicInScopeOfQuery(const ActionsDAG::Node * node)
 }
 
 static const ActionsDAG::Node * splitFilterNodeForAllowedInputs(
-    const ActionsDAG::Node * node,
-    const Block * allowed_inputs,
-    ActionsDAG::Nodes & additional_nodes,
-    bool allow_non_deterministic_functions)
+    const ActionsDAG::Node * node, const Block * allowed_inputs, ActionsDAG::Nodes & additional_nodes, bool allow_partial_result)
 {
     if (node->type == ActionsDAG::ActionType::FUNCTION)
     {
@@ -285,13 +277,14 @@ static const ActionsDAG::Node * splitFilterNodeForAllowedInputs(
             auto & node_copy = additional_nodes.emplace_back(*node);
             node_copy.children.clear();
             for (const auto * child : node->children)
-                if (const auto * child_copy = splitFilterNodeForAllowedInputs(child, allowed_inputs, additional_nodes, allow_non_deterministic_functions))
+                if (const auto * child_copy
+                    = splitFilterNodeForAllowedInputs(child, allowed_inputs, additional_nodes, allow_partial_result))
                     node_copy.children.push_back(child_copy);
-                /// Expression like (now_allowed AND allowed) is not allowed if allow_non_deterministic_functions = true. This is important for
+                /// Expression like (not_allowed AND allowed) is not allowed if allow_partial_result = false. This is important for
                 /// trivial count optimization, otherwise we can get incorrect results. For example, if the query is
                 /// SELECT count() FROM table WHERE _partition_id = '0' AND rowNumberInBlock() = 1, we cannot apply
                 /// trivial count.
-                else if (!allow_non_deterministic_functions)
+                else if (!allow_partial_result)
                     return nullptr;
 
             if (node_copy.children.empty())
@@ -300,7 +293,7 @@ static const ActionsDAG::Node * splitFilterNodeForAllowedInputs(
             if (node_copy.children.size() == 1)
             {
                 const ActionsDAG::Node * res = node_copy.children.front();
-                /// Expression like (not_allowed AND 256) can't be resuced to (and(256)) because AND requires
+                /// Expression like (not_allowed AND 256) can't be reduced to (and(256)) because AND requires
                 /// at least two arguments; also it can't be reduced to (256) because result type is different.
                 if (!res->result_type->equals(*node->result_type))
                 {
@@ -318,7 +311,7 @@ static const ActionsDAG::Node * splitFilterNodeForAllowedInputs(
         {
             auto & node_copy = additional_nodes.emplace_back(*node);
             for (auto & child : node_copy.children)
-                if (child = splitFilterNodeForAllowedInputs(child, allowed_inputs, additional_nodes, allow_non_deterministic_functions); !child)
+                if (child = splitFilterNodeForAllowedInputs(child, allowed_inputs, additional_nodes, allow_partial_result); !child)
                     return nullptr;
 
             return &node_copy;
@@ -332,7 +325,8 @@ static const ActionsDAG::Node * splitFilterNodeForAllowedInputs(
                     auto index_hint_dag = index_hint->getActions().clone();
                     ActionsDAG::NodeRawConstPtrs atoms;
                     for (const auto & output : index_hint_dag.getOutputs())
-                        if (const auto * child_copy = splitFilterNodeForAllowedInputs(output, allowed_inputs, additional_nodes, allow_non_deterministic_functions))
+                        if (const auto * child_copy
+                            = splitFilterNodeForAllowedInputs(output, allowed_inputs, additional_nodes, allow_partial_result))
                             atoms.push_back(child_copy);
 
                     if (!atoms.empty())
@@ -366,22 +360,24 @@ static const ActionsDAG::Node * splitFilterNodeForAllowedInputs(
     return node;
 }
 
-std::optional<ActionsDAG> splitFilterDagForAllowedInputs(const ActionsDAG::Node * predicate, const Block * allowed_inputs, bool allow_non_deterministic_functions)
+std::optional<ActionsDAG>
+splitFilterDagForAllowedInputs(const ActionsDAG::Node * predicate, const Block * allowed_inputs, bool allow_partial_result)
 {
     if (!predicate)
         return {};
 
     ActionsDAG::Nodes additional_nodes;
-    const auto * res = splitFilterNodeForAllowedInputs(predicate, allowed_inputs, additional_nodes, allow_non_deterministic_functions);
+    const auto * res = splitFilterNodeForAllowedInputs(predicate, allowed_inputs, additional_nodes, allow_partial_result);
     if (!res)
         return {};
 
     return ActionsDAG::cloneSubDAG({res}, true);
 }
 
-void filterBlockWithPredicate(const ActionsDAG::Node * predicate, Block & block, ContextPtr context)
+void filterBlockWithPredicate(
+    const ActionsDAG::Node * predicate, Block & block, ContextPtr context, bool allow_filtering_with_partial_predicate)
 {
-    auto dag = splitFilterDagForAllowedInputs(predicate, &block,  /*allow_non_deterministic_functions=*/ false);
+    auto dag = splitFilterDagForAllowedInputs(predicate, &block, /*allow_partial_result=*/allow_filtering_with_partial_predicate);
     if (dag)
         filterBlockWithExpression(buildFilterExpression(std::move(*dag), context), block);
 }
diff --git a/src/Storages/VirtualColumnUtils.h b/src/Storages/VirtualColumnUtils.h
index abf46dc23a4..f76cf2cad76 100644
--- a/src/Storages/VirtualColumnUtils.h
+++ b/src/Storages/VirtualColumnUtils.h
@@ -26,9 +26,13 @@ namespace VirtualColumnUtils
 ///
 /// Otherwise calling filter*() outside applyFilters() will throw "Not-ready Set is passed"
 /// if there are subqueries.
+///
+/// Similar to filterBlockWithExpression(buildFilterExpression(splitFilterDagForAllowedInputs(...))). Similar to filterBlockWithQuery, but uses ActionsDAG as a predicate.
+/// Basically it is filterBlockWithDAG(splitFilterDagForAllowedInputs).
+/// If allow_filtering_with_partial_predicate is true, then the filtering will be done even if some part of the predicate
+/// cannot be evaluated using the columns from the block.
+void filterBlockWithPredicate(const ActionsDAG::Node * predicate, Block & block, ContextPtr context, bool allow_filtering_with_partial_predicate = true);
 
-/// Similar to filterBlockWithExpression(buildFilterExpression(splitFilterDagForAllowedInputs(...))).
-void filterBlockWithPredicate(const ActionsDAG::Node * predicate, Block & block, ContextPtr context);
 
 /// Just filters block. Block should contain all the required columns.
 ExpressionActionsPtr buildFilterExpression(ActionsDAG dag, ContextPtr context);
@@ -41,15 +45,15 @@ void buildSetsForDAG(const ActionsDAG & dag, const ContextPtr & context);
 bool isDeterministicInScopeOfQuery(const ActionsDAG::Node * node);
 
 /// Extract a part of predicate that can be evaluated using only columns from input_names.
-/// When allow_non_deterministic_functions is true then even if the predicate contains non-deterministic
-/// functions, we still allow to extract a part of the predicate, otherwise we return nullptr.
-/// allow_non_deterministic_functions must be false when we are going to use the result to filter parts in
+/// When allow_partial_result is false, then the result will be empty if any part of it cannot be evaluated deterministically
+/// on the given inputs.
+/// allow_partial_result must be false when we are going to use the result to filter parts in
 /// MergeTreeData::totalRowsByPartitionPredicateImp. For example, if the query is
 /// `SELECT count() FROM table  WHERE _partition_id = '0' AND rowNumberInBlock() = 1`
 /// The predicate will be `_partition_id = '0' AND rowNumberInBlock() = 1`, and `rowNumberInBlock()` is
 /// non-deterministic. If we still extract the part `_partition_id = '0'` for filtering parts, then trivial
 /// count optimization will be mistakenly applied to the query.
-std::optional<ActionsDAG> splitFilterDagForAllowedInputs(const ActionsDAG::Node * predicate, const Block * allowed_inputs, bool allow_non_deterministic_functions = true);
+std::optional<ActionsDAG> splitFilterDagForAllowedInputs(const ActionsDAG::Node * predicate, const Block * allowed_inputs, bool allow_partial_result = true);
 
 /// Extract from the input stream a set of `name` column values
 template <typename T>
diff --git a/tests/queries/0_stateless/03217_read_rows_in_system_tables.reference b/tests/queries/0_stateless/03217_read_rows_in_system_tables.reference
new file mode 100644
index 00000000000..b21ead49b1e
--- /dev/null
+++ b/tests/queries/0_stateless/03217_read_rows_in_system_tables.reference
@@ -0,0 +1,10 @@
+information_schema	tables
+default	test_replica_1	r1
+Expression ((Project names + Projection))
+  Aggregating
+    Expression (Before GROUP BY)
+      ReadFromMerge
+        Filter (( + ( + )))
+          ReadFromMergeTree (default.test_replica_1)
+1	1
+1	1
diff --git a/tests/queries/0_stateless/03217_read_rows_in_system_tables.sql b/tests/queries/0_stateless/03217_read_rows_in_system_tables.sql
new file mode 100644
index 00000000000..3bea04ccccf
--- /dev/null
+++ b/tests/queries/0_stateless/03217_read_rows_in_system_tables.sql
@@ -0,0 +1,34 @@
+SELECT database, table FROM system.tables WHERE database = 'information_schema' AND table = 'tables';
+
+-- To verify StorageSystemReplicas applies the filter properly
+CREATE TABLE test_replica_1(x UInt32)
+    ENGINE ReplicatedMergeTree('/clickhouse/tables/{database}/test_03217/test_replica', 'r1')
+    ORDER BY x;
+CREATE TABLE test_replica_2(x UInt32)
+    ENGINE ReplicatedMergeTree('/clickhouse/tables/{database}/test_03217/test_replica', 'r2')
+    ORDER BY x;
+
+SELECT database, table, replica_name FROM system.replicas WHERE database = currentDatabase() AND table = 'test_replica_1' AND replica_name = 'r1';
+
+
+-- To verify StorageMerge
+CREATE TABLE all_replicas (x UInt32)
+    ENGINE = Merge(currentDatabase(), 'test_replica_*');
+
+INSERT INTO test_replica_1 SELECT number AS x FROM numbers(10);
+SYSTEM SYNC REPLICA test_replica_2;
+-- If the filter not applied, then the plan will show both replicas
+EXPLAIN SELECT _table, count() FROM all_replicas WHERE  _table = 'test_replica_1' AND x >= 0 GROUP BY _table;
+
+SYSTEM FLUSH LOGS;
+-- argMin-argMax make the test repeatable
+
+-- StorageSystemTables
+SELECT argMin(read_rows, event_time_microseconds), argMax(read_rows, event_time_microseconds) FROM system.query_log WHERE 1
+    AND query LIKE '%SELECT database, table FROM system.tables WHERE database = \'information_schema\' AND table = \'tables\';'
+    AND type = 'QueryFinish';
+
+-- StorageSystemReplicas
+SELECT argMin(read_rows, event_time_microseconds), argMax(read_rows, event_time_microseconds) FROM system.query_log WHERE 1
+    AND query LIKE '%SELECT database, table, replica_name FROM system.replicas WHERE database = currentDatabase() AND table = \'test_replica_1\' AND replica_name = \'r1\';'
+    AND type = 'QueryFinish';

From 5eb896b9f1976feaa423071919e65d22e09da4ea Mon Sep 17 00:00:00 2001
From: Blargian <shaunstruwig.ss@gmail.com>
Date: Wed, 7 Aug 2024 10:43:41 +0200
Subject: [PATCH 08/52] Add documentation for toDecimal32 and variants

---
 .../functions/type-conversion-functions.md    | 471 ++++++++++++------
 1 file changed, 305 insertions(+), 166 deletions(-)

diff --git a/docs/en/sql-reference/functions/type-conversion-functions.md b/docs/en/sql-reference/functions/type-conversion-functions.md
index 1e618b8cdab..24055bb99b7 100644
--- a/docs/en/sql-reference/functions/type-conversion-functions.md
+++ b/docs/en/sql-reference/functions/type-conversion-functions.md
@@ -95,7 +95,7 @@ SELECT
     toInt8(-8),
     toInt8(-8.8),
     toInt8('-8')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -156,7 +156,7 @@ Query:
 SELECT
     toInt8OrZero('-8'),
     toInt8OrZero('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -216,7 +216,7 @@ Query:
 SELECT
     toInt8OrNull('-8'),
     toInt8OrNull('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -281,7 +281,7 @@ Query:
 SELECT
     toInt8OrDefault('-8', CAST('-1', 'Int8')),
     toInt8OrDefault('abc', CAST('-1', 'Int8'))
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -345,7 +345,7 @@ SELECT
     toInt16(-16),
     toInt16(-16.16),
     toInt16('-16')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -406,7 +406,7 @@ Query:
 SELECT
     toInt16OrZero('-16'),
     toInt16OrZero('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -466,7 +466,7 @@ Query:
 SELECT
     toInt16OrNull('-16'),
     toInt16OrNull('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -531,7 +531,7 @@ Query:
 SELECT
     toInt16OrDefault('-16', CAST('-1', 'Int16')),
     toInt16OrDefault('abc', CAST('-1', 'Int16'))
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -595,7 +595,7 @@ SELECT
     toInt32(-32),
     toInt32(-32.32),
     toInt32('-32')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -656,7 +656,7 @@ Query:
 SELECT
     toInt32OrZero('-32'),
     toInt32OrZero('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -715,7 +715,7 @@ Query:
 SELECT
     toInt32OrNull('-32'),
     toInt32OrNull('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -780,7 +780,7 @@ Query:
 SELECT
     toInt32OrDefault('-32', CAST('-1', 'Int32')),
     toInt32OrDefault('abc', CAST('-1', 'Int32'))
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -844,7 +844,7 @@ SELECT
     toInt64(-64),
     toInt64(-64.64),
     toInt64('-64')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -905,7 +905,7 @@ Query:
 SELECT
     toInt64OrZero('-64'),
     toInt64OrZero('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -965,7 +965,7 @@ Query:
 SELECT
     toInt64OrNull('-64'),
     toInt64OrNull('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -1030,7 +1030,7 @@ Query:
 SELECT
     toInt64OrDefault('-64', CAST('-1', 'Int64')),
     toInt64OrDefault('abc', CAST('-1', 'Int64'))
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -1093,7 +1093,7 @@ SELECT
     toInt128(-128),
     toInt128(-128.8),
     toInt128('-128')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -1154,7 +1154,7 @@ Query:
 SELECT
     toInt128OrZero('-128'),
     toInt128OrZero('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -1214,7 +1214,7 @@ Query:
 SELECT
     toInt128OrNull('-128'),
     toInt128OrNull('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -1279,7 +1279,7 @@ Query:
 SELECT
     toInt128OrDefault('-128', CAST('-1', 'Int128')),
     toInt128OrDefault('abc', CAST('-1', 'Int128'))
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -1342,7 +1342,7 @@ SELECT
     toInt256(-256),
     toInt256(-256.256),
     toInt256('-256')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -1403,7 +1403,7 @@ Query:
 SELECT
     toInt256OrZero('-256'),
     toInt256OrZero('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -1463,7 +1463,7 @@ Query:
 SELECT
     toInt256OrNull('-256'),
     toInt256OrNull('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -1528,7 +1528,7 @@ Query:
 SELECT
     toInt256OrDefault('-256', CAST('-1', 'Int256')),
     toInt256OrDefault('abc', CAST('-1', 'Int256'))
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -1592,7 +1592,7 @@ SELECT
     toUInt8(8),
     toUInt8(8.8),
     toUInt8('8')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -1653,7 +1653,7 @@ Query:
 SELECT
     toUInt8OrZero('-8'),
     toUInt8OrZero('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -1713,7 +1713,7 @@ Query:
 SELECT
     toUInt8OrNull('8'),
     toUInt8OrNull('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -1778,7 +1778,7 @@ Query:
 SELECT
     toUInt8OrDefault('8', CAST('0', 'UInt8')),
     toUInt8OrDefault('abc', CAST('0', 'UInt8'))
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -1842,7 +1842,7 @@ SELECT
     toUInt16(16),
     toUInt16(16.16),
     toUInt16('16')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -1903,7 +1903,7 @@ Query:
 SELECT
     toUInt16OrZero('16'),
     toUInt16OrZero('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -1963,7 +1963,7 @@ Query:
 SELECT
     toUInt16OrNull('16'),
     toUInt16OrNull('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -2028,7 +2028,7 @@ Query:
 SELECT
     toUInt16OrDefault('16', CAST('0', 'UInt16')),
     toUInt16OrDefault('abc', CAST('0', 'UInt16'))
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -2092,7 +2092,7 @@ SELECT
     toUInt32(32),
     toUInt32(32.32),
     toUInt32('32')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -2154,7 +2154,7 @@ Query:
 SELECT
     toUInt32OrZero('32'),
     toUInt32OrZero('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -2214,7 +2214,7 @@ Query:
 SELECT
     toUInt32OrNull('32'),
     toUInt32OrNull('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -2279,7 +2279,7 @@ Query:
 SELECT
     toUInt32OrDefault('32', CAST('0', 'UInt32')),
     toUInt32OrDefault('abc', CAST('0', 'UInt32'))
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -2343,7 +2343,7 @@ SELECT
     toUInt64(64),
     toUInt64(64.64),
     toUInt64('64')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -2404,7 +2404,7 @@ Query:
 SELECT
     toUInt64OrZero('64'),
     toUInt64OrZero('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -2464,7 +2464,7 @@ Query:
 SELECT
     toUInt64OrNull('64'),
     toUInt64OrNull('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -2529,7 +2529,7 @@ Query:
 SELECT
     toUInt64OrDefault('64', CAST('0', 'UInt64')),
     toUInt64OrDefault('abc', CAST('0', 'UInt64'))
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -2592,7 +2592,7 @@ SELECT
     toUInt128(128),
     toUInt128(128.8),
     toUInt128('128')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -2653,7 +2653,7 @@ Query:
 SELECT
     toUInt128OrZero('128'),
     toUInt128OrZero('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -2713,7 +2713,7 @@ Query:
 SELECT
     toUInt128OrNull('128'),
     toUInt128OrNull('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -2778,7 +2778,7 @@ Query:
 SELECT
     toUInt128OrDefault('128', CAST('0', 'UInt128')),
     toUInt128OrDefault('abc', CAST('0', 'UInt128'))
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -2841,7 +2841,7 @@ SELECT
     toUInt256(256),
     toUInt256(256.256),
     toUInt256('256')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -2902,7 +2902,7 @@ Query:
 SELECT
     toUInt256OrZero('256'),
     toUInt256OrZero('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -2962,7 +2962,7 @@ Query:
 SELECT
     toUInt256OrNull('256'),
     toUInt256OrNull('abc')
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -3027,7 +3027,7 @@ Query:
 SELECT
     toUInt256OrDefault('-256', CAST('0', 'UInt256')),
     toUInt256OrDefault('abc', CAST('0', 'UInt256'))
-FORMAT vertical;
+FORMAT Vertical;
 ```
 
 Result:
@@ -3542,173 +3542,312 @@ SELECT toDateTime64('2019-01-01 00:00:00', 3, 'Asia/Istanbul') AS value, toTypeN
 
 ## toDateTime64OrDefault
 
-## toDecimal(32\|64\|128\|256)
+## toDecimal32
 
-Converts `value` to the [Decimal](../data-types/decimal.md) data type with precision of `S`. The `value` can be a number or a string. The `S` (scale) parameter specifies the number of decimal places.
+Converts an input value to a value of type [`Decimal(9, S)`](../data-types/decimal.md) with scale of `S`. Throws an exception in case of an error.
 
-- `toDecimal32(value, S)`
-- `toDecimal64(value, S)`
-- `toDecimal128(value, S)`
-- `toDecimal256(value, S)`
+**Syntax**
 
-## toDecimal(32\|64\|128\|256)OrNull
-
-Converts an input string to a [Nullable(Decimal(P,S))](../data-types/decimal.md) data type value. This family of functions includes:
-
-- `toDecimal32OrNull(expr, S)` — Results in `Nullable(Decimal32(S))` data type.
-- `toDecimal64OrNull(expr, S)` — Results in `Nullable(Decimal64(S))` data type.
-- `toDecimal128OrNull(expr, S)` — Results in `Nullable(Decimal128(S))` data type.
-- `toDecimal256OrNull(expr, S)` — Results in `Nullable(Decimal256(S))` data type.
-
-These functions should be used instead of `toDecimal*()` functions, if you prefer to get a `NULL` value instead of an exception in the event of an input value parsing error.
+```sql
+toDecimal32(expr, S)
+```
 
 **Arguments**
 
-- `expr` — [Expression](../syntax.md/#syntax-expressions), returns a value in the [String](../data-types/string.md) data type. ClickHouse expects the textual representation of the decimal number. For example, `'1.111'`.
-- `S` — Scale, the number of decimal places in the resulting value.
+- `expr` — Expression returning a number or a string representation of a number. [Expression](../syntax.md/#syntax-expressions).
+- `S` — Scale parameter between 0 and 9, specifying how many decimal digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+
+Supported arguments:
+- Values or string representations of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type Float32/64.
+
+Unsupported arguments:
+- Values or string representations of Float32/64 values `NaN` and `Inf` (case-insensitive).
+- String representations of binary and hexadecimal values, e.g. `SELECT toDecimal32('0xc0fe', 1);`.
+
+:::note
+Integer overflow can occur if the value of `expr` exceeds the bounds of `Decimal32`: `( -1 * 10^(9 - S), 1 * 10^(9 - S) )`. 
+Excessive digits in a fraction are discarded (not rounded). 
+Excessive digits in the integer part will lead to an exception.
+:::
 
 **Returned value**
 
-A value in the `Nullable(Decimal(P,S))` data type. The value contains:
+- Value of type `Decimal(9, S)`. [Decimal32(S)](../data-types/decimal.md).
 
-- Number with `S` decimal places, if ClickHouse interprets the input string as a number.
-- `NULL`, if ClickHouse can’t interpret the input string as a number or if the input number contains more than `S` decimal places.
-
-**Examples**
+**Example**
 
 Query:
 
-``` sql
-SELECT toDecimal32OrNull(toString(-1.111), 5) AS val, toTypeName(val);
+```sql
+SELECT
+    toDecimal32(2, 1) AS a, toTypeName(a) AS type_a,
+    toDecimal32(4.2, 2) AS b, toTypeName(b) AS type_b,
+    toDecimal32('4.2', 3) AS c, toTypeName(c) AS type_c
+FORMAT Vertical;
 ```
 
 Result:
 
 ```response
-┌────val─┬─toTypeName(toDecimal32OrNull(toString(-1.111), 5))─┐
-│ -1.111 │ Nullable(Decimal(9, 5))                            │
-└────────┴────────────────────────────────────────────────────┘
+Row 1:
+──────
+a:      2
+type_a: Decimal(9, 1)
+b:      4.2
+type_b: Decimal(9, 2)
+c:      4.2
+type_c: Decimal(9, 3)
 ```
 
-Query:
+**See also**
 
-``` sql
-SELECT toDecimal32OrNull(toString(-1.111), 2) AS val, toTypeName(val);
+- [`toDecimal32OrZero`](#todecimal32orzero).
+- [`toDecimal32OrNull`](#todecimal32ornull).
+- [`toDecimal32OrDefault`](#todecimal32ordefault).
+
+## toDecimal32OrZero
+
+Like [`toDecimal32`](#todecimal32), this function converts an input value to a value of type [Decimal(9, S)](../data-types/decimal.md) but returns `0` in case of an error.
+
+**Syntax**
+
+```sql
+toDecimal32OrZero(expr, S)
 ```
 
-Result:
-
-```response
-┌──val─┬─toTypeName(toDecimal32OrNull(toString(-1.111), 2))─┐
-│ ᴺᵁᴸᴸ │ Nullable(Decimal(9, 2))                            │
-└──────┴────────────────────────────────────────────────────┘
-```
-
-
-## toDecimal(32\|64\|128\|256)OrDefault
-
-Converts an input string to a [Decimal(P,S)](../data-types/decimal.md) data type value. This family of functions includes:
-
-- `toDecimal32OrDefault(expr, S)` — Results in `Decimal32(S)` data type.
-- `toDecimal64OrDefault(expr, S)` — Results in `Decimal64(S)` data type.
-- `toDecimal128OrDefault(expr, S)` — Results in `Decimal128(S)` data type.
-- `toDecimal256OrDefault(expr, S)` — Results in `Decimal256(S)` data type.
-
-These functions should be used instead of `toDecimal*()` functions, if you prefer to get a default value instead of an exception in the event of an input value parsing error.
-
 **Arguments**
 
-- `expr` — [Expression](../syntax.md/#syntax-expressions), returns a value in the [String](../data-types/string.md) data type. ClickHouse expects the textual representation of the decimal number. For example, `'1.111'`.
-- `S` — Scale, the number of decimal places in the resulting value.
+- `expr` — A String representation of a number. [String](../data-types/string.md).
+- `S` — Scale parameter between 0 and 9, specifying how many decimal digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+
+Supported arguments:
+- String representations of type (U)Int8/16/32/64/128/256.
+- String representations of type Float32/64.
+
+Unsupported arguments:
+- String representations of Float32/64 values `NaN` and `Inf` (case-insensitive).
+- String representations of binary and hexadecimal values, e.g. `SELECT toDecimal32OrZero('0xc0fe', 1);`.
+
+:::note
+Integer overflow can occur if the value of `expr` exceeds the bounds of `Decimal32`: `( -1 * 10^(9 - S), 1 * 10^(9 - S) )`.
+Excessive digits in a fraction are discarded (not rounded).
+Excessive digits in the integer part will lead to an error.
+:::
 
 **Returned value**
 
-A value in the `Decimal(P,S)` data type. The value contains:
-
-- Number with `S` decimal places, if ClickHouse interprets the input string as a number.
-- Default `Decimal(P,S)` data type value, if ClickHouse can’t interpret the input string as a number or if the input number contains more than `S` decimal places.
-
-**Examples**
-
-Query:
-
-``` sql
-SELECT toDecimal32OrDefault(toString(-1.111), 5) AS val, toTypeName(val);
-```
-
-Result:
-
-```response
-┌────val─┬─toTypeName(toDecimal32OrDefault(toString(-1.111), 5))─┐
-│ -1.111 │ Decimal(9, 5)                                         │
-└────────┴───────────────────────────────────────────────────────┘
-```
-
-Query:
-
-``` sql
-SELECT toDecimal32OrDefault(toString(-1.111), 2) AS val, toTypeName(val);
-```
-
-Result:
-
-```response
-┌─val─┬─toTypeName(toDecimal32OrDefault(toString(-1.111), 2))─┐
-│   0 │ Decimal(9, 2)                                         │
-└─────┴───────────────────────────────────────────────────────┘
-```
-
-## toDecimal(32\|64\|128\|256)OrZero
-
-Converts an input value to the [Decimal(P,S)](../data-types/decimal.md) data type. This family of functions includes:
-
-- `toDecimal32OrZero( expr, S)` — Results in `Decimal32(S)` data type.
-- `toDecimal64OrZero( expr, S)` — Results in `Decimal64(S)` data type.
-- `toDecimal128OrZero( expr, S)` — Results in `Decimal128(S)` data type.
-- `toDecimal256OrZero( expr, S)` — Results in `Decimal256(S)` data type.
-
-These functions should be used instead of `toDecimal*()` functions, if you prefer to get a `0` value instead of an exception in the event of an input value parsing error.
-
-**Arguments**
-
-- `expr` — [Expression](../syntax.md/#syntax-expressions), returns a value in the [String](../data-types/string.md) data type. ClickHouse expects the textual representation of the decimal number. For example, `'1.111'`.
-- `S` — Scale, the number of decimal places in the resulting value.
-
-**Returned value**
-
-A value in the `Nullable(Decimal(P,S))` data type. The value contains:
-
-- Number with `S` decimal places, if ClickHouse interprets the input string as a number.
-- 0 with `S` decimal places, if ClickHouse can’t interpret the input string as a number or if the input number contains more than `S` decimal places.
+- Value of type `Decimal(9, S)` if successful, otherwise `0` with `S` decimal places. [Decimal32(S)](../data-types/decimal.md).
 
 **Example**
 
 Query:
 
 ``` sql
-SELECT toDecimal32OrZero(toString(-1.111), 5) AS val, toTypeName(val);
+SELECT
+    toDecimal32OrZero(toString(-1.111), 5) AS val,
+    toTypeName(val)
+FORMAT Vertical;
 ```
 
 Result:
 
 ```response
-┌────val─┬─toTypeName(toDecimal32OrZero(toString(-1.111), 5))─┐
-│ -1.111 │ Decimal(9, 5)                                      │
-└────────┴────────────────────────────────────────────────────┘
+Row 1:
+──────
+val:             -1.111
+toTypeName(val): Decimal(9, 5)
 ```
 
 Query:
 
 ``` sql
-SELECT toDecimal32OrZero(toString(-1.111), 2) AS val, toTypeName(val);
+SELECT
+    toDecimal32OrZero(toString(-1.111), 2) AS val,
+    toTypeName(val)
+FORMAT Vertical;
 ```
 
 Result:
 
 ```response
-┌──val─┬─toTypeName(toDecimal32OrZero(toString(-1.111), 2))─┐
-│ 0.00 │ Decimal(9, 2)                                      │
-└──────┴────────────────────────────────────────────────────┘
+Row 1:
+──────
+val:             -1.11
+toTypeName(val): Decimal(9, 2)
+```
+
+**See also**
+
+- [`toDecimal32`](#todecimal32).
+- [`toDecimal32OrNull`](#todecimal32ornull).
+- [`toDecimal32OrDefault`](#todecimal32ordefault).
+
+## toDecimal32OrNull
+
+Like [`toDecimal32`](#todecimal32), this function converts an input value to a value of type [Nullable(Decimal(9, S))](../data-types/decimal.md) but returns `NULL` in case of an error.
+
+**Syntax**
+
+```sql
+toDecimal32OrNull(expr, S)
+```
+
+**Arguments**
+
+- `expr` — A String representation of a number. [String](../data-types/string.md).
+- `S` — Scale parameter between 0 and 9, specifying how many decimal digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+
+Supported arguments:
+- String representations of type (U)Int8/16/32/64/128/256.
+- String representations of type Float32/64.
+
+Unsupported arguments:
+- String representations of Float32/64 values `NaN` and `Inf` (case-insensitive).
+- String representations of binary and hexadecimal values, e.g. `SELECT toDecimal32OrNull('0xc0fe', 1);`.
+
+:::note
+Integer overflow can occur if the value of `expr` exceeds the bounds of `Decimal32`: `( -1 * 10^(9 - S), 1 * 10^(9 - S) )`.
+Excessive digits in a fraction are discarded (not rounded).
+Excessive digits in the integer part will lead to an error.
+:::
+
+**Returned value**
+
+- Value of type `Nullable(Decimal(9, S))` if successful, otherwise value `NULL` of the same type. [Decimal32(S)](../data-types/decimal.md).
+
+**Examples**
+
+Query:
+
+``` sql
+SELECT
+    toDecimal32OrNull(toString(-1.111), 5) AS val,
+    toTypeName(val)
+FORMAT Vertical;
+```
+
+Result:
+
+```response
+Row 1:
+──────
+val:             -1.111
+toTypeName(val): Nullable(Decimal(9, 5))
+```
+
+Query:
+
+``` sql
+SELECT
+    toDecimal32OrNull(toString(-1.111), 2) AS val,
+    toTypeName(val)
+FORMAT Vertical;
+```
+
+Result:
+
+```response
+Row 1:
+──────
+val:             -1.11
+toTypeName(val): Nullable(Decimal(9, 2))
+```
+
+**See also**
+
+- [`toDecimal32`](#todecimal32).
+- [`toDecimal32OrZero`](#todecimal32orzero).
+- [`toDecimal32OrDefault`](#todecimal32ordefault).
+
+## toDecimal32OrDefault
+
+Like [`toDecimal32`](#todecimal32), this function converts an input value to a value of type [Decimal(9, S)](../data-types/decimal.md) but returns the default value in case of an error.
+
+**Syntax**
+
+```sql
+toDecimal32OrDefault(expr, S[, default])
+```
+
+**Arguments**
+
+- `expr` — A String representation of a number. [String](../data-types/string.md).
+- `S` — Scale parameter between 0 and 9, specifying how many decimal digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+- `default` (optional) — The default value to return if parsing to type `Decimal32(S)` is unsuccessful. [Decimal32(S)](../data-types/decimal.md).
+
+Supported arguments:
+- String representations of type (U)Int8/16/32/64/128/256.
+- String representations of type Float32/64.
+
+Unsupported arguments:
+- String representations of Float32/64 values `NaN` and `Inf` (case-insensitive).
+- String representations of binary and hexadecimal values, e.g. `SELECT toDecimal32OrDefault('0xc0fe', 1);`.
+
+:::note
+Integer overflow can occur if the value of `expr` exceeds the bounds of `Decimal32`: `( -1 * 10^(9 - S), 1 * 10^(9 - S) )`.
+Excessive digits in a fraction are discarded (not rounded).
+Excessive digits in the integer part will lead to an error.
+:::
+
+**Returned value**
+
+- Value of type `Decimal(9, S)` if successful, otherwise returns the default value if passed or `0` if not. [Decimal32(S)](../data-types/decimal.md).
+
+**Examples**
+
+Query:
+
+``` sql
+SELECT
+    toDecimal32OrDefault(toString(-1.111), 5) AS val,
+    toTypeName(val)
+FORMAT Vertical;
+```
+
+Result:
+
+```response
+Row 1:
+──────
+val:             -1.111
+toTypeName(val): Decimal(9, 5)
+```
+
+Query:
+
+``` sql
+SELECT
+    toDecimal32OrDefault(toString(-1.111), 2) AS val,
+    toTypeName(val)
+FORMAT Vertical;
+```
+
+Result:
+
+```response
+Row 1:
+──────
+val:             -1.11
+toTypeName(val): Decimal(9, 2)
+```
+
+Query:
+
+``` sql
+SELECT
+    toDecimal32OrDefault('Inf', 2, CAST('0', 'Decimal32(2)')) AS val,
+    toTypeName(val)
+FORMAT Vertical;
+```
+
+Result:
+
+```response
+Row 1:
+──────
+val:             0
+toTypeName(val): Decimal(9, 2)
 ```
 
 ## toString

From 4f2b1c36b7115143a23462282dc5474ed5b90afd Mon Sep 17 00:00:00 2001
From: Blargian <shaunstruwig.ss@gmail.com>
Date: Wed, 7 Aug 2024 11:12:09 +0200
Subject: [PATCH 09/52] Fix typo from previous PR

---
 docs/en/sql-reference/functions/type-conversion-functions.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/en/sql-reference/functions/type-conversion-functions.md b/docs/en/sql-reference/functions/type-conversion-functions.md
index 24055bb99b7..5db44da3e2d 100644
--- a/docs/en/sql-reference/functions/type-conversion-functions.md
+++ b/docs/en/sql-reference/functions/type-conversion-functions.md
@@ -2362,7 +2362,7 @@ toUInt64('64'):  64
 - [`toUInt64OrNull`](#touint64ornull).
 - [`toUInt64OrDefault`](#touint64ordefault).
 
-## toInt64OrZero
+## toUInt64OrZero
 
 Like [`toUInt64`](#touint64), this function converts an input value to a value of type [UInt64](../data-types/int-uint.md) but returns `0` in case of an error.
 

From b76e4acbc0a260f5222249a250066c77d2fcaff8 Mon Sep 17 00:00:00 2001
From: Blargian <shaunstruwig.ss@gmail.com>
Date: Wed, 7 Aug 2024 11:13:56 +0200
Subject: [PATCH 10/52] fix another typo

---
 docs/en/sql-reference/functions/type-conversion-functions.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/en/sql-reference/functions/type-conversion-functions.md b/docs/en/sql-reference/functions/type-conversion-functions.md
index 5db44da3e2d..8e72fea7fdb 100644
--- a/docs/en/sql-reference/functions/type-conversion-functions.md
+++ b/docs/en/sql-reference/functions/type-conversion-functions.md
@@ -1546,7 +1546,7 @@ toInt256OrDefault('abc', CAST('-1', 'Int256')):  -1
 - [`toInt256OrZero`](#toint256orzero).
 - [`toInt256OrNull`](#toint256ornull).
 
-# toUInt8
+## toUInt8
 
 Converts an input value to a value of type [`UInt8`](../data-types/int-uint.md). Throws an exception in case of an error.
 

From 6172c56c1fd27f39d11914542f9e2dcb94fffd36 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?J=C3=A1nos=20Benjamin=20Antal?=
 <benjamin.antal@clickhouse.com>
Date: Wed, 7 Aug 2024 09:48:38 +0000
Subject: [PATCH 11/52] Split tests to separate vaguely correlated tests

---
 ...3217_filtering_in_storage_merge.reference} |  6 +----
 .../03217_filtering_in_storage_merge.sql      | 16 +++++++++++
 ...03217_filtering_in_system_tables.reference |  4 +++
 ...l => 03217_filtering_in_system_tables.sql} | 27 +++++++------------
 4 files changed, 30 insertions(+), 23 deletions(-)
 rename tests/queries/0_stateless/{03217_read_rows_in_system_tables.reference => 03217_filtering_in_storage_merge.reference} (54%)
 create mode 100644 tests/queries/0_stateless/03217_filtering_in_storage_merge.sql
 create mode 100644 tests/queries/0_stateless/03217_filtering_in_system_tables.reference
 rename tests/queries/0_stateless/{03217_read_rows_in_system_tables.sql => 03217_filtering_in_system_tables.sql} (55%)

diff --git a/tests/queries/0_stateless/03217_read_rows_in_system_tables.reference b/tests/queries/0_stateless/03217_filtering_in_storage_merge.reference
similarity index 54%
rename from tests/queries/0_stateless/03217_read_rows_in_system_tables.reference
rename to tests/queries/0_stateless/03217_filtering_in_storage_merge.reference
index b21ead49b1e..d366ad04c39 100644
--- a/tests/queries/0_stateless/03217_read_rows_in_system_tables.reference
+++ b/tests/queries/0_stateless/03217_filtering_in_storage_merge.reference
@@ -1,10 +1,6 @@
-information_schema	tables
-default	test_replica_1	r1
 Expression ((Project names + Projection))
   Aggregating
     Expression (Before GROUP BY)
       ReadFromMerge
         Filter (( + ( + )))
-          ReadFromMergeTree (default.test_replica_1)
-1	1
-1	1
+          ReadFromMergeTree (default.test_03217_merge_replica_1)
diff --git a/tests/queries/0_stateless/03217_filtering_in_storage_merge.sql b/tests/queries/0_stateless/03217_filtering_in_storage_merge.sql
new file mode 100644
index 00000000000..5ecc1e7c672
--- /dev/null
+++ b/tests/queries/0_stateless/03217_filtering_in_storage_merge.sql
@@ -0,0 +1,16 @@
+CREATE TABLE test_03217_merge_replica_1(x UInt32)
+    ENGINE ReplicatedMergeTree('/clickhouse/tables/{database}/test_03217_merge_replica', 'r1')
+    ORDER BY x;
+CREATE TABLE test_03217_merge_replica_2(x UInt32)
+    ENGINE ReplicatedMergeTree('/clickhouse/tables/{database}/test_03217_merge_replica', 'r2')
+    ORDER BY x;
+
+
+CREATE TABLE test_03217_all_replicas (x UInt32)
+    ENGINE = Merge(currentDatabase(), 'test_03217_merge_replica_*');
+
+INSERT INTO test_03217_merge_replica_1 SELECT number AS x FROM numbers(10);
+SYSTEM SYNC REPLICA test_03217_merge_replica_2;
+
+-- If the filter on _table is not applied, then the plan will show both replicas
+EXPLAIN SELECT _table, count() FROM test_03217_all_replicas WHERE  _table = 'test_03217_merge_replica_1' AND x >= 0 GROUP BY _table;
diff --git a/tests/queries/0_stateless/03217_filtering_in_system_tables.reference b/tests/queries/0_stateless/03217_filtering_in_system_tables.reference
new file mode 100644
index 00000000000..218fddf92e0
--- /dev/null
+++ b/tests/queries/0_stateless/03217_filtering_in_system_tables.reference
@@ -0,0 +1,4 @@
+information_schema	tables
+default	test_03217_system_tables_replica_1	r1
+1	1
+1	1
diff --git a/tests/queries/0_stateless/03217_read_rows_in_system_tables.sql b/tests/queries/0_stateless/03217_filtering_in_system_tables.sql
similarity index 55%
rename from tests/queries/0_stateless/03217_read_rows_in_system_tables.sql
rename to tests/queries/0_stateless/03217_filtering_in_system_tables.sql
index 3bea04ccccf..bbc755e478d 100644
--- a/tests/queries/0_stateless/03217_read_rows_in_system_tables.sql
+++ b/tests/queries/0_stateless/03217_filtering_in_system_tables.sql
@@ -1,27 +1,18 @@
+-- If filtering on databases is not done correctly, this query is reported as reading 3 rows, which are: `system.tables`, `information_schema.tables` and `INFORMATION_SCHEMA.tables`
 SELECT database, table FROM system.tables WHERE database = 'information_schema' AND table = 'tables';
 
--- To verify StorageSystemReplicas applies the filter properly
-CREATE TABLE test_replica_1(x UInt32)
-    ENGINE ReplicatedMergeTree('/clickhouse/tables/{database}/test_03217/test_replica', 'r1')
+CREATE TABLE test_03217_system_tables_replica_1(x UInt32)
+    ENGINE ReplicatedMergeTree('/clickhouse/tables/{database}/test_03217_system_tables_replica', 'r1')
     ORDER BY x;
-CREATE TABLE test_replica_2(x UInt32)
-    ENGINE ReplicatedMergeTree('/clickhouse/tables/{database}/test_03217/test_replica', 'r2')
+CREATE TABLE test_03217_system_tables_replica_2(x UInt32)
+    ENGINE ReplicatedMergeTree('/clickhouse/tables/{database}/test_03217_system_tables_replica', 'r2')
     ORDER BY x;
 
-SELECT database, table, replica_name FROM system.replicas WHERE database = currentDatabase() AND table = 'test_replica_1' AND replica_name = 'r1';
-
-
--- To verify StorageMerge
-CREATE TABLE all_replicas (x UInt32)
-    ENGINE = Merge(currentDatabase(), 'test_replica_*');
-
-INSERT INTO test_replica_1 SELECT number AS x FROM numbers(10);
-SYSTEM SYNC REPLICA test_replica_2;
--- If the filter not applied, then the plan will show both replicas
-EXPLAIN SELECT _table, count() FROM all_replicas WHERE  _table = 'test_replica_1' AND x >= 0 GROUP BY _table;
+-- If filtering on the database-table columns is not done correctly, this query is reported as reading 2 rows, which are the two tables created above
+SELECT database, table, replica_name FROM system.replicas WHERE database = currentDatabase() AND table = 'test_03217_system_tables_replica_1' AND replica_name = 'r1';
 
 SYSTEM FLUSH LOGS;
--- argMin-argMax make the test repeatable
+-- argMin-argMax is necessary to make the test repeatable
 
 -- StorageSystemTables
 SELECT argMin(read_rows, event_time_microseconds), argMax(read_rows, event_time_microseconds) FROM system.query_log WHERE 1
@@ -30,5 +21,5 @@ SELECT argMin(read_rows, event_time_microseconds), argMax(read_rows, event_time_
 
 -- StorageSystemReplicas
 SELECT argMin(read_rows, event_time_microseconds), argMax(read_rows, event_time_microseconds) FROM system.query_log WHERE 1
-    AND query LIKE '%SELECT database, table, replica_name FROM system.replicas WHERE database = currentDatabase() AND table = \'test_replica_1\' AND replica_name = \'r1\';'
+    AND query LIKE '%SELECT database, table, replica_name FROM system.replicas WHERE database = currentDatabase() AND table = \'test_03217_system_tables_replica_1\' AND replica_name = \'r1\';'
     AND type = 'QueryFinish';

From ddc058aa6ff6780fa67bc5c59d9d7ff9a71d4ee1 Mon Sep 17 00:00:00 2001
From: Antonio Andelic <antonio@clickhouse.com>
Date: Wed, 7 Aug 2024 12:51:06 +0200
Subject: [PATCH 12/52] Update minio in stateless tests

---
 docker/test/stateless/Dockerfile     |  4 ++--
 docker/test/stateless/setup_minio.sh | 10 +++++-----
 2 files changed, 7 insertions(+), 7 deletions(-)

diff --git a/docker/test/stateless/Dockerfile b/docker/test/stateless/Dockerfile
index a0e5513a3a2..d8eb072328f 100644
--- a/docker/test/stateless/Dockerfile
+++ b/docker/test/stateless/Dockerfile
@@ -69,8 +69,8 @@ ENV MAX_RUN_TIME=0
 
 # Unrelated to vars in setup_minio.sh, but should be the same there
 # to have the same binaries for local running scenario
-ARG MINIO_SERVER_VERSION=2022-01-03T18-22-58Z
-ARG MINIO_CLIENT_VERSION=2022-01-05T23-52-51Z
+ARG MINIO_SERVER_VERSION=2024-08-03T04-33-23Z
+ARG MINIO_CLIENT_VERSION=2024-07-31T15-58-33Z
 ARG TARGETARCH
 
 # Download Minio-related binaries
diff --git a/docker/test/stateless/setup_minio.sh b/docker/test/stateless/setup_minio.sh
index 2b9433edd20..d8310d072b8 100755
--- a/docker/test/stateless/setup_minio.sh
+++ b/docker/test/stateless/setup_minio.sh
@@ -59,8 +59,8 @@ find_os() {
 download_minio() {
   local os
   local arch
-  local minio_server_version=${MINIO_SERVER_VERSION:-2022-09-07T22-25-02Z}
-  local minio_client_version=${MINIO_CLIENT_VERSION:-2022-08-28T20-08-11Z}
+  local minio_server_version=${MINIO_SERVER_VERSION:-2024-08-03T04-33-23Z}
+  local minio_client_version=${MINIO_CLIENT_VERSION:-2024-07-31T15-58-33Z}
 
   os=$(find_os)
   arch=$(find_arch)
@@ -82,10 +82,10 @@ setup_minio() {
   local test_type=$1
   ./mc alias set clickminio http://localhost:11111 clickhouse clickhouse
   ./mc admin user add clickminio test testtest
-  ./mc admin policy set clickminio readwrite user=test
+  ./mc admin policy attach clickminio readwrite --user=test
   ./mc mb --ignore-existing clickminio/test
   if [ "$test_type" = "stateless" ]; then
-    ./mc policy set public clickminio/test
+    ./mc anonymous set public clickminio/test
   fi
 }
 
@@ -148,4 +148,4 @@ main() {
   setup_aws_credentials
 }
 
-main "$@"
\ No newline at end of file
+main "$@"

From 28c8d158635ef2564a60c25a6f971aa324030dcc Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?J=C3=A1nos=20Benjamin=20Antal?=
 <benjamin.antal@clickhouse.com>
Date: Wed, 7 Aug 2024 13:37:56 +0000
Subject: [PATCH 13/52] Fix style

---
 tests/queries/0_stateless/03217_filtering_in_system_tables.sql | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/tests/queries/0_stateless/03217_filtering_in_system_tables.sql b/tests/queries/0_stateless/03217_filtering_in_system_tables.sql
index bbc755e478d..72ca7c8684d 100644
--- a/tests/queries/0_stateless/03217_filtering_in_system_tables.sql
+++ b/tests/queries/0_stateless/03217_filtering_in_system_tables.sql
@@ -16,10 +16,12 @@ SYSTEM FLUSH LOGS;
 
 -- StorageSystemTables
 SELECT argMin(read_rows, event_time_microseconds), argMax(read_rows, event_time_microseconds) FROM system.query_log WHERE 1
+    AND current_database = currentDatabase()
     AND query LIKE '%SELECT database, table FROM system.tables WHERE database = \'information_schema\' AND table = \'tables\';'
     AND type = 'QueryFinish';
 
 -- StorageSystemReplicas
 SELECT argMin(read_rows, event_time_microseconds), argMax(read_rows, event_time_microseconds) FROM system.query_log WHERE 1
+    AND current_database = currentDatabase()
     AND query LIKE '%SELECT database, table, replica_name FROM system.replicas WHERE database = currentDatabase() AND table = \'test_03217_system_tables_replica_1\' AND replica_name = \'r1\';'
     AND type = 'QueryFinish';

From ad678cb5a8d4533a88273b8244dc0844c83e641c Mon Sep 17 00:00:00 2001
From: alesapin <alesapin@gmail.com>
Date: Wed, 7 Aug 2024 18:24:03 +0200
Subject: [PATCH 14/52] Ignore disappeared projections on start

---
 src/Storages/MergeTree/IMergeTreeDataPart.cpp | 33 +++++++++++-
 .../MergeTree/MergeTreeDataPartChecksum.cpp   |  6 ---
 .../MergeTree/MergeTreeDataPartChecksum.h     |  3 --
 .../test_broken_projections/test.py           | 50 +++++++++++++++++++
 4 files changed, 81 insertions(+), 11 deletions(-)

diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp
index 3a44359b537..918a4cda714 100644
--- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp
+++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp
@@ -72,6 +72,7 @@ namespace ErrorCodes
     extern const int BAD_TTL_FILE;
     extern const int NOT_IMPLEMENTED;
     extern const int NO_SUCH_COLUMN_IN_TABLE;
+    extern const int FILE_DOESNT_EXIST;
 }
 
 
@@ -749,8 +750,16 @@ void IMergeTreeDataPart::loadColumnsChecksumsIndexes(bool require_columns_checks
                 /// Probably there is something wrong with files of this part.
                 /// So it can be helpful to add to the error message some information about those files.
                 String files_in_part;
+
                 for (auto it = getDataPartStorage().iterate(); it->isValid(); it->next())
-                    files_in_part += fmt::format("{}{} ({} bytes)", (files_in_part.empty() ? "" : ", "), it->name(), getDataPartStorage().getFileSize(it->name()));
+                {
+                    std::string file_info;
+                    if (!getDataPartStorage().isDirectory(it->name()))
+                        file_info = fmt::format(" ({} bytes)", getDataPartStorage().getFileSize(it->name()));
+
+                    files_in_part += fmt::format("{}{}{}", (files_in_part.empty() ? "" : ", "), it->name(), file_info);
+
+                }
                 if (!files_in_part.empty())
                     e->addMessage("Part contains files: {}", files_in_part);
                 if (isEmpty())
@@ -2141,7 +2150,27 @@ void IMergeTreeDataPart::checkConsistencyBase() const
             }
         }
 
-        checksums.checkSizes(getDataPartStorage());
+        const auto & data_part_storage = getDataPartStorage();
+        for (const auto & [filename, checksum] : checksums.files)
+        {
+            try
+            {
+                checksum.checkSize(data_part_storage, filename);
+            }
+            catch (const Exception & ex)
+            {
+                /// For projection parts check will mark them broken in loadProjections
+                if (!parent_part && filename.ends_with(".proj"))
+                {
+                    std::string projection_name = fs::path(filename).stem();
+                    LOG_INFO(storage.log, "Projection {} doesn't exist on start for part {}, marking it as broken", projection_name, name);
+                    if (hasProjection(projection_name))
+                        markProjectionPartAsBroken(projection_name, ex.message(), ex.code());
+                }
+                else
+                    throw;
+            }
+        }
     }
     else
     {
diff --git a/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp b/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp
index b327480fa92..3ef36ce364c 100644
--- a/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp
+++ b/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp
@@ -100,12 +100,6 @@ void MergeTreeDataPartChecksums::checkEqual(const MergeTreeDataPartChecksums & r
     }
 }
 
-void MergeTreeDataPartChecksums::checkSizes(const IDataPartStorage & storage) const
-{
-    for (const auto & [name, checksum] : files)
-        checksum.checkSize(storage, name);
-}
-
 UInt64 MergeTreeDataPartChecksums::getTotalSizeOnDisk() const
 {
     UInt64 res = 0;
diff --git a/src/Storages/MergeTree/MergeTreeDataPartChecksum.h b/src/Storages/MergeTree/MergeTreeDataPartChecksum.h
index 05178dc3a60..dc52f1ada2b 100644
--- a/src/Storages/MergeTree/MergeTreeDataPartChecksum.h
+++ b/src/Storages/MergeTree/MergeTreeDataPartChecksum.h
@@ -65,9 +65,6 @@ struct MergeTreeDataPartChecksums
 
     static bool isBadChecksumsErrorCode(int code);
 
-    /// Checks that the directory contains all the needed files of the correct size. Does not check the checksum.
-    void checkSizes(const IDataPartStorage & storage) const;
-
     /// Returns false if the checksum is too old.
     bool read(ReadBuffer & in);
     /// Assume that header with version (the first line) is read
diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py
index 162c0dbaa2f..578ff42369c 100644
--- a/tests/integration/test_broken_projections/test.py
+++ b/tests/integration/test_broken_projections/test.py
@@ -4,6 +4,7 @@ import logging
 import string
 import random
 from helpers.cluster import ClickHouseCluster
+from multiprocessing.dummy import Pool
 
 cluster = ClickHouseCluster(__file__)
 
@@ -18,6 +19,12 @@ def cluster():
             stay_alive=True,
             with_zookeeper=True,
         )
+        cluster.add_instance(
+            "node_restart",
+            main_configs=["config.d/dont_start_broken.xml"],
+            stay_alive=True,
+            with_zookeeper=True,
+        )
 
         logging.info("Starting cluster...")
         cluster.start()
@@ -632,6 +639,49 @@ def test_broken_on_start(cluster):
     check(node, table_name, 0)
 
 
+def test_disappeared_projection_on_start(cluster):
+    node = cluster.instances["node_restart"]
+
+    table_name = "test_disapperead_projection"
+    create_table(node, table_name, 1)
+
+    node.query(f"SYSTEM STOP MERGES {table_name}")
+
+    insert(node, table_name, 0, 5)
+    insert(node, table_name, 5, 5)
+    insert(node, table_name, 10, 5)
+    insert(node, table_name, 15, 5)
+
+    assert ["all_0_0_0", "all_1_1_0", "all_2_2_0", "all_3_3_0"] == get_parts(
+        node, table_name
+    )
+
+    def drop_projection():
+        node.query(
+            f"ALTER TABLE {table_name} DROP PROJECTION proj2",
+            settings={"mutations_sync": "0"},
+        )
+
+    p = Pool(2)
+    p.apply_async(drop_projection)
+
+    for i in range(30):
+        create_query = node.query(f"SHOW CREATE TABLE {table_name}")
+        if "proj2" not in create_query:
+            break
+        time.sleep(0.5)
+
+    assert "proj2" not in create_query
+
+    # Remove 'proj2' for part all_2_2_0
+    break_projection(node, table_name, "proj2", "all_2_2_0", "part")
+
+    node.restart_clickhouse()
+
+    # proj2 is not broken, it doesn't exist, but ok
+    check(node, table_name, 0, expect_broken_part="proj2", do_check_command=0)
+
+
 def test_mutation_with_broken_projection(cluster):
     node = cluster.instances["node"]
 

From 0dc4d773edd530494c1ab514d104a45665bdd16a Mon Sep 17 00:00:00 2001
From: alesapin <alesapin@gmail.com>
Date: Wed, 7 Aug 2024 18:46:34 +0200
Subject: [PATCH 15/52] Fix style

---
 src/Storages/MergeTree/IMergeTreeDataPart.cpp | 1 -
 1 file changed, 1 deletion(-)

diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp
index 918a4cda714..93904c1a838 100644
--- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp
+++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp
@@ -72,7 +72,6 @@ namespace ErrorCodes
     extern const int BAD_TTL_FILE;
     extern const int NOT_IMPLEMENTED;
     extern const int NO_SUCH_COLUMN_IN_TABLE;
-    extern const int FILE_DOESNT_EXIST;
 }
 
 

From ec3a248e70e16d2cb4db1ec5ff17e95cc11dedae Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?J=C3=A1nos=20Benjamin=20Antal?=
 <benjamin.antal@clickhouse.com>
Date: Wed, 7 Aug 2024 17:37:54 +0000
Subject: [PATCH 16/52] Fix clang-tidy

---
 src/Storages/MergeTree/MergeTreeData.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp
index b24d7968b61..5ee0bd328e0 100644
--- a/src/Storages/MergeTree/MergeTreeData.cpp
+++ b/src/Storages/MergeTree/MergeTreeData.cpp
@@ -1146,7 +1146,7 @@ std::optional<UInt64> MergeTreeData::totalRowsByPartitionPredicateImpl(
     auto metadata_snapshot = getInMemoryMetadataPtr();
     auto virtual_columns_block = getBlockWithVirtualsForFilter(metadata_snapshot, {parts[0]});
 
-    auto filter_dag = VirtualColumnUtils::splitFilterDagForAllowedInputs(filter_actions_dag.getOutputs().at(0), nullptr, /*allow_non_deterministic_functions=*/ false);
+    auto filter_dag = VirtualColumnUtils::splitFilterDagForAllowedInputs(filter_actions_dag.getOutputs().at(0), nullptr, /*allow_partial_result=*/ false);
     if (!filter_dag)
         return {};
 

From d81b5239debaf01b74521511db44d6cb4cd419c4 Mon Sep 17 00:00:00 2001
From: Alexey Milovidov <milovidov@clickhouse.com>
Date: Wed, 7 Aug 2024 21:37:01 +0200
Subject: [PATCH 17/52] Remove unused CLI option

---
 src/Client/ClientApplicationBase.cpp | 2 --
 1 file changed, 2 deletions(-)

diff --git a/src/Client/ClientApplicationBase.cpp b/src/Client/ClientApplicationBase.cpp
index 9f133616d2e..71d13ad4f53 100644
--- a/src/Client/ClientApplicationBase.cpp
+++ b/src/Client/ClientApplicationBase.cpp
@@ -200,8 +200,6 @@ void ClientApplicationBase::init(int argc, char ** argv)
         ("pager", po::value<std::string>(), "Pipe all output into this command (less or similar)")
         ("max_memory_usage_in_client", po::value<std::string>(), "Set memory limit in client/local server")
 
-        ("fuzzer-args", po::value<std::string>(), "Command line arguments for the LLVM's libFuzzer driver. Only relevant if the application is compiled with libFuzzer.")
-
         ("client_logs_file", po::value<std::string>(), "Path to a file for writing client logs. Currently we only have fatal logs (when the client crashes)")
     ;
 

From 1dece979fe317a04f98d2b8008619c47fb72edb1 Mon Sep 17 00:00:00 2001
From: Nikita Fomichev <nikita.fomichev@clickhouse.com>
Date: Wed, 7 Aug 2024 23:10:40 +0200
Subject: [PATCH 18/52] CI: pass job timeout into tests

---
 tests/ci/ci.py                    | 1 +
 tests/ci/ci_definitions.py        | 2 +-
 tests/ci/functional_test_check.py | 3 +++
 3 files changed, 5 insertions(+), 1 deletion(-)

diff --git a/tests/ci/ci.py b/tests/ci/ci.py
index 8d0414ce7a8..49b597333dc 100644
--- a/tests/ci/ci.py
+++ b/tests/ci/ci.py
@@ -985,6 +985,7 @@ def _run_test(job_name: str, run_command: str) -> int:
     else:
         print("Use run command from the workflow")
     env["CHECK_NAME"] = job_name
+    env["MAX_RUN_TIME"] = str(timeout or 0)
     print(f"Going to start run command [{run_command}]")
     stopwatch = Stopwatch()
     job_log = Path(TEMP_PATH) / "job_log.txt"
diff --git a/tests/ci/ci_definitions.py b/tests/ci/ci_definitions.py
index 48847b0d7a6..592cb2f4879 100644
--- a/tests/ci/ci_definitions.py
+++ b/tests/ci/ci_definitions.py
@@ -420,7 +420,7 @@ class CommonJobConfigs:
         ),
         run_command='functional_test_check.py "$CHECK_NAME"',
         runner_type=Runners.FUNC_TESTER,
-        timeout=9000,
+        timeout=1000,  # test
     )
     STATEFUL_TEST = JobConfig(
         job_name_keyword="stateful",
diff --git a/tests/ci/functional_test_check.py b/tests/ci/functional_test_check.py
index 52970404d2d..3aff97643c3 100644
--- a/tests/ci/functional_test_check.py
+++ b/tests/ci/functional_test_check.py
@@ -114,6 +114,9 @@ def get_run_command(
     if flaky_check:
         envs.append("-e NUM_TRIES=50")
         envs.append("-e MAX_RUN_TIME=2800")
+    else:
+        max_run_time = os.getenv("MAX_RUN_TIME", 0)
+        envs.append(f"-e MAX_RUN_TIME={max_run_time}")
 
     envs += [f"-e {e}" for e in additional_envs]
 

From 086b3d240dd696c483f136d79db4587a83bb0a14 Mon Sep 17 00:00:00 2001
From: Nikita Fomichev <nikita.fomichev@clickhouse.com>
Date: Wed, 7 Aug 2024 23:34:36 +0200
Subject: [PATCH 19/52] CI: push CI

---
 tests/ci/ci_definitions.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/ci/ci_definitions.py b/tests/ci/ci_definitions.py
index 592cb2f4879..b62d2e0aa8e 100644
--- a/tests/ci/ci_definitions.py
+++ b/tests/ci/ci_definitions.py
@@ -420,7 +420,7 @@ class CommonJobConfigs:
         ),
         run_command='functional_test_check.py "$CHECK_NAME"',
         runner_type=Runners.FUNC_TESTER,
-        timeout=1000,  # test
+        timeout=1001,  # test
     )
     STATEFUL_TEST = JobConfig(
         job_name_keyword="stateful",

From 55ad7d30946d609159fe5ae9156f02f5b160585a Mon Sep 17 00:00:00 2001
From: Nikita Fomichev <nikita.fomichev@clickhouse.com>
Date: Thu, 8 Aug 2024 00:08:12 +0200
Subject: [PATCH 20/52] Fix stylelint

---
 tests/ci/functional_test_check.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/ci/functional_test_check.py b/tests/ci/functional_test_check.py
index 3aff97643c3..b7391eff01b 100644
--- a/tests/ci/functional_test_check.py
+++ b/tests/ci/functional_test_check.py
@@ -115,7 +115,7 @@ def get_run_command(
         envs.append("-e NUM_TRIES=50")
         envs.append("-e MAX_RUN_TIME=2800")
     else:
-        max_run_time = os.getenv("MAX_RUN_TIME", 0)
+        max_run_time = os.getenv("MAX_RUN_TIME", "0")
         envs.append(f"-e MAX_RUN_TIME={max_run_time}")
 
     envs += [f"-e {e}" for e in additional_envs]

From 142e9528f0f1f7daa68f296181f1c0e5f7b6108b Mon Sep 17 00:00:00 2001
From: Alexey Milovidov <milovidov@clickhouse.com>
Date: Thu, 8 Aug 2024 03:10:45 +0200
Subject: [PATCH 21/52] Add a test for #57420

---
 .../03218_materialize_msan.reference          |  1 +
 .../0_stateless/03218_materialize_msan.sql    | 21 +++++++++++++++++++
 2 files changed, 22 insertions(+)
 create mode 100644 tests/queries/0_stateless/03218_materialize_msan.reference
 create mode 100644 tests/queries/0_stateless/03218_materialize_msan.sql

diff --git a/tests/queries/0_stateless/03218_materialize_msan.reference b/tests/queries/0_stateless/03218_materialize_msan.reference
new file mode 100644
index 00000000000..eb84f35f9f4
--- /dev/null
+++ b/tests/queries/0_stateless/03218_materialize_msan.reference
@@ -0,0 +1 @@
+[(NULL,'11\01111111\011111','1111')]		-2147483648	\N
diff --git a/tests/queries/0_stateless/03218_materialize_msan.sql b/tests/queries/0_stateless/03218_materialize_msan.sql
new file mode 100644
index 00000000000..b41300ea1e3
--- /dev/null
+++ b/tests/queries/0_stateless/03218_materialize_msan.sql
@@ -0,0 +1,21 @@
+SELECT
+    materialize([(NULL, '11\01111111\011111', '1111')]) AS t,
+    (t[1048576]).2,
+    materialize(-2147483648),
+    (t[-2147483648]).1
+GROUP BY
+    materialize([(NULL, '1')]),
+    '',
+    (materialize((t[1023]).2), (materialize(''), (t[2147483647]).1, materialize(9223372036854775807)), (materialize(''), materialize(NULL, 2147483647, t[65535], 256)), materialize(NULL))
+; -- { serverError NUMBER_OF_ARGUMENTS_DOESNT_MATCH}
+
+SELECT
+    materialize([(NULL, '11\01111111\011111', '1111')]) AS t,
+    (t[1048576]).2,
+    materialize(-2147483648),
+    (t[-2147483648]).1
+GROUP BY
+    materialize([(NULL, '1')]),
+    '',
+    (materialize((t[1023]).2), (materialize(''), (t[2147483647]).1, materialize(9223372036854775807)), (materialize(''), materialize(NULL), materialize(2147483647), materialize(t[65535]), materialize(256)), materialize(NULL))
+;

From d6ecabb41dff64a1fb8ac5a77ffc1a8bed15162b Mon Sep 17 00:00:00 2001
From: Julia Kartseva <yulia.kartseva@gmail.com>
Date: Mon, 5 Aug 2024 00:40:23 +0000
Subject: [PATCH 22/52] Fix flaky
 test_storage_s3_queue/test.py::test_multiple_tables_streaming_sync_distributed

Disable parallel processing for the Ordered mode for the
test_storage_s3_queue/test.py::test_multiple_tables_streaming_sync_distributed
test.

The reason for this is that the load between the processing nodes is
too uneven when s3queue_processing_threads_num != 1,
e.g.:

```
$ grep res1 pytest.log
2024-08-07 07:15:58 [ 575 ] DEBUG : res1 size: 13300, res2 size: 1700, total_rows: 15000 (test.py:813, test_multiple_tables_streaming_sync_distributed)
```

In the CI environment, there are rare cases when one of the processors handles all the workload
while the other is busy-waiting, and the test then fails on an assert.

When s3queue_processing_threads_num == 1, the workload is evenly
distributed:

```
$ grep res1 pytest.log
2024-08-07 07:26:52 [ 586 ] DEBUG : res1 size: 7200, res2 size: 7800, total_rows: 15000 (test.py:813, test_multiple_tables_streaming_sync_distributed)
```

This change only fixes the test flakiness. Further investigation of the Ordered
mode parallelism is required.
---
 tests/integration/test_storage_s3_queue/test.py | 10 +++++++++-
 1 file changed, 9 insertions(+), 1 deletion(-)

diff --git a/tests/integration/test_storage_s3_queue/test.py b/tests/integration/test_storage_s3_queue/test.py
index 92d6f181464..8f197e09e61 100644
--- a/tests/integration/test_storage_s3_queue/test.py
+++ b/tests/integration/test_storage_s3_queue/test.py
@@ -771,7 +771,11 @@ def test_multiple_tables_streaming_sync_distributed(started_cluster, mode):
             table_name,
             mode,
             files_path,
-            additional_settings={"keeper_path": keeper_path, "s3queue_buckets": 2},
+            additional_settings={
+                "keeper_path": keeper_path,
+                "s3queue_buckets": 2,
+                **({"s3queue_processing_threads_num": 1} if mode == "ordered" else {}),
+            },
         )
 
     for instance in [node, node_2]:
@@ -806,6 +810,10 @@ def test_multiple_tables_streaming_sync_distributed(started_cluster, mode):
         list(map(int, l.split())) for l in run_query(node_2, get_query).splitlines()
     ]
 
+    logging.debug(
+        f"res1 size: {len(res1)}, res2 size: {len(res2)}, total_rows: {total_rows}"
+    )
+
     assert len(res1) + len(res2) == total_rows
 
     # Checking that all engines have made progress

From d0f35ce6a60e13b8aff9687a45e293ce89693241 Mon Sep 17 00:00:00 2001
From: Antonio Andelic <antonio@clickhouse.com>
Date: Thu, 8 Aug 2024 10:29:01 +0200
Subject: [PATCH 23/52] Fix setting prefix

---
 src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp b/src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp
index 433a0e96d2e..7205b5b3294 100644
--- a/src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp
+++ b/src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp
@@ -305,7 +305,8 @@ void S3ObjectStorage::listObjects(const std::string & path, RelativePathsWithMet
 
     S3::ListObjectsV2Request request;
     request.SetBucket(uri.bucket);
-    request.SetPrefix(path);
+    if (path != "/")
+        request.SetPrefix(path);
     if (max_keys)
         request.SetMaxKeys(static_cast<int>(max_keys));
     else

From 59b737c9ac045ca0ec48eb2b8893c5e54646003a Mon Sep 17 00:00:00 2001
From: Nikita Fomichev <nikita.fomichev@clickhouse.com>
Date: Thu, 8 Aug 2024 10:50:14 +0200
Subject: [PATCH 24/52] CI: set correct timeout for stateless tests

---
 tests/ci/ci_definitions.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/ci/ci_definitions.py b/tests/ci/ci_definitions.py
index b62d2e0aa8e..48847b0d7a6 100644
--- a/tests/ci/ci_definitions.py
+++ b/tests/ci/ci_definitions.py
@@ -420,7 +420,7 @@ class CommonJobConfigs:
         ),
         run_command='functional_test_check.py "$CHECK_NAME"',
         runner_type=Runners.FUNC_TESTER,
-        timeout=1001,  # test
+        timeout=9000,
     )
     STATEFUL_TEST = JobConfig(
         job_name_keyword="stateful",

From b0ba53788ac758ac1405ceefacd91bb0418b5834 Mon Sep 17 00:00:00 2001
From: Robert Schulze <robert@clickhouse.com>
Date: Wed, 7 Aug 2024 16:29:07 +0000
Subject: [PATCH 25/52] Refactor tests for (experimental) statistics

---
 docs/en/development/tests.md                  |   4 +-
 .../statements/alter/statistics.md            |  16 +-
 src/Storages/MergeTree/MergeTreeData.cpp      |   2 +-
 ...2864_statistics_count_min_sketch.reference |  14 --
 .../02864_statistics_count_min_sketch.sql     |  70 ------
 .../02864_statistics_ddl.reference            |  37 +--
 .../0_stateless/02864_statistics_ddl.sql      | 234 ++++++++++++++----
 ...delayed_materialization_in_merge.reference |  12 +
 ...stics_delayed_materialization_in_merge.sql |  36 +++
 .../02864_statistics_exception.reference      |   0
 .../02864_statistics_exception.sql            |  55 ----
 ..._statistics_materialize_in_merge.reference |  10 -
 .../02864_statistics_materialize_in_merge.sql |  52 ----
 .../02864_statistics_predicates.reference     |  92 +++++++
 .../02864_statistics_predicates.sql           | 214 ++++++++++++++++
 .../02864_statistics_uniq.reference           |  35 ---
 .../0_stateless/02864_statistics_uniq.sql     |  73 ------
 .../02864_statistics_usage.reference          |  20 ++
 .../0_stateless/02864_statistics_usage.sql    |  42 ++++
 19 files changed, 619 insertions(+), 399 deletions(-)
 delete mode 100644 tests/queries/0_stateless/02864_statistics_count_min_sketch.reference
 delete mode 100644 tests/queries/0_stateless/02864_statistics_count_min_sketch.sql
 create mode 100644 tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.reference
 create mode 100644 tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.sql
 delete mode 100644 tests/queries/0_stateless/02864_statistics_exception.reference
 delete mode 100644 tests/queries/0_stateless/02864_statistics_exception.sql
 delete mode 100644 tests/queries/0_stateless/02864_statistics_materialize_in_merge.reference
 delete mode 100644 tests/queries/0_stateless/02864_statistics_materialize_in_merge.sql
 create mode 100644 tests/queries/0_stateless/02864_statistics_predicates.reference
 create mode 100644 tests/queries/0_stateless/02864_statistics_predicates.sql
 delete mode 100644 tests/queries/0_stateless/02864_statistics_uniq.reference
 delete mode 100644 tests/queries/0_stateless/02864_statistics_uniq.sql
 create mode 100644 tests/queries/0_stateless/02864_statistics_usage.reference
 create mode 100644 tests/queries/0_stateless/02864_statistics_usage.sql

diff --git a/docs/en/development/tests.md b/docs/en/development/tests.md
index 269995a1a96..6cb36e2049b 100644
--- a/docs/en/development/tests.md
+++ b/docs/en/development/tests.md
@@ -14,7 +14,7 @@ Each functional test sends one or multiple queries to the running ClickHouse ser
 
 Tests are located in `queries` directory. There are two subdirectories: `stateless` and `stateful`. Stateless tests run queries without any preloaded test data - they often create small synthetic datasets on the fly, within the test itself. Stateful tests require preloaded test data from ClickHouse and it is available to general public.
 
-Each test can be one of two types: `.sql` and `.sh`. `.sql` test is the simple SQL script that is piped to `clickhouse-client --multiquery`. `.sh` test is a script that is run by itself. SQL tests are generally preferable to `.sh` tests. You should use `.sh` tests only when you have to test some feature that cannot be exercised from pure SQL, such as piping some input data into `clickhouse-client` or testing `clickhouse-local`.
+Each test can be one of two types: `.sql` and `.sh`. `.sql` test is the simple SQL script that is piped to `clickhouse-client`. `.sh` test is a script that is run by itself. SQL tests are generally preferable to `.sh` tests. You should use `.sh` tests only when you have to test some feature that cannot be exercised from pure SQL, such as piping some input data into `clickhouse-client` or testing `clickhouse-local`.
 
 :::note
 A common mistake when testing data types `DateTime` and `DateTime64` is assuming that the server uses a specific time zone (e.g. "UTC"). This is not the case, time zones in CI test runs
@@ -38,7 +38,7 @@ For more options, see `tests/clickhouse-test --help`. You can simply run all tes
 
 ### Adding a New Test
 
-To add new test, create a `.sql` or `.sh` file in `queries/0_stateless` directory, check it manually and then generate `.reference` file in the following way: `clickhouse-client --multiquery < 00000_test.sql > 00000_test.reference` or `./00000_test.sh > ./00000_test.reference`.
+To add new test, create a `.sql` or `.sh` file in `queries/0_stateless` directory, check it manually and then generate `.reference` file in the following way: `clickhouse-client < 00000_test.sql > 00000_test.reference` or `./00000_test.sh > ./00000_test.reference`.
 
 Tests should use (create, drop, etc) only tables in `test` database that is assumed to be created beforehand; also tests can use temporary tables.
 
diff --git a/docs/en/sql-reference/statements/alter/statistics.md b/docs/en/sql-reference/statements/alter/statistics.md
index 6880cef0e5c..7a1774a01b5 100644
--- a/docs/en/sql-reference/statements/alter/statistics.md
+++ b/docs/en/sql-reference/statements/alter/statistics.md
@@ -8,26 +8,28 @@ sidebar_label: STATISTICS
 
 The following operations are available:
 
--   `ALTER TABLE [db].table ADD STATISTICS (columns list) TYPE (type list)` - Adds statistic description to tables metadata.
+-   `ALTER TABLE [db].table ADD STATISTICS [IF NOT EXISTS] (column list) TYPE (type list)` - Adds a statistics description to the table's metadata.
 
--   `ALTER TABLE [db].table MODIFY STATISTICS (columns list) TYPE (type list)` - Modifies statistic description to tables metadata.
+-   `ALTER TABLE [db].table MODIFY STATISTICS (column list) TYPE (type list)` - Modifies the statistics description in the table's metadata.
 
--   `ALTER TABLE [db].table DROP STATISTICS (columns list)` - Removes statistics from the metadata of the specified columns and deletes all statistics objects in all parts for the specified columns.
+-   `ALTER TABLE [db].table DROP STATISTICS [IF EXISTS] (column list)` - Removes statistics from the metadata of the specified columns and deletes all statistics objects in all parts for the specified columns.
 
--   `ALTER TABLE [db].table CLEAR STATISTICS (columns list)` - Deletes all statistics objects in all parts for the specified columns. Statistics objects can be rebuild using `ALTER TABLE MATERIALIZE STATISTICS`.
+-   `ALTER TABLE [db].table CLEAR STATISTICS [IF EXISTS] (column list)` - Deletes all statistics objects in all parts for the specified columns. Statistics objects can be rebuilt using `ALTER TABLE MATERIALIZE STATISTICS`.
 
--   `ALTER TABLE [db.]table MATERIALIZE STATISTICS (columns list)` - Rebuilds the statistic for columns. Implemented as a [mutation](../../../sql-reference/statements/alter/index.md#mutations). 
+-   `ALTER TABLE [db.]table MATERIALIZE STATISTICS [IF EXISTS] (column list)` - Rebuilds the statistic for columns. Implemented as a [mutation](../../../sql-reference/statements/alter/index.md#mutations). 
 
 The first two commands are lightweight in a sense that they only change metadata or remove files.
 
 Also, they are replicated, syncing statistics metadata via ZooKeeper.
 
-There is an example adding two statistics types to two columns:
+## Example:
+
+Adding two statistics types to two columns:
 
 ```
 ALTER TABLE t1 MODIFY STATISTICS c, d TYPE TDigest, Uniq;
 ```
 
 :::note
-Statistic manipulation is supported only for tables with [`*MergeTree`](../../../engines/table-engines/mergetree-family/mergetree.md) engine (including [replicated](../../../engines/table-engines/mergetree-family/replication.md) variants).
+Statistics are supported only for [`*MergeTree`](../../../engines/table-engines/mergetree-family/mergetree.md) engine tables (including [replicated](../../../engines/table-engines/mergetree-family/replication.md) variants).
 :::
diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp
index 051d52a71cd..fe4857e9449 100644
--- a/src/Storages/MergeTree/MergeTreeData.cpp
+++ b/src/Storages/MergeTree/MergeTreeData.cpp
@@ -3513,7 +3513,7 @@ void MergeTreeData::checkAlterIsPossible(const AlterCommands & commands, Context
                         const auto & new_column = new_metadata.getColumns().get(command.column_name);
                         if (!old_column.type->equals(*new_column.type))
                             throw Exception(ErrorCodes::ALTER_OF_COLUMN_IS_FORBIDDEN,
-                                            "ALTER types of column {} with statistics is not not safe "
+                                            "ALTER types of column {} with statistics is not safe "
                                             "because it can change the representation of statistics",
                                             backQuoteIfNeed(command.column_name));
                     }
diff --git a/tests/queries/0_stateless/02864_statistics_count_min_sketch.reference b/tests/queries/0_stateless/02864_statistics_count_min_sketch.reference
deleted file mode 100644
index 02c41656a36..00000000000
--- a/tests/queries/0_stateless/02864_statistics_count_min_sketch.reference
+++ /dev/null
@@ -1,14 +0,0 @@
-CREATE TABLE default.tab\n(\n    `a` String,\n    `b` UInt64,\n    `c` Int64,\n    `pk` String\n)\nENGINE = MergeTree\nORDER BY pk\nSETTINGS min_bytes_for_wide_part = 0, index_granularity = 8192
-Test statistics count_min:
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(equals(a, \'0\'), equals(b, 0), equals(c, 0)) (removed)
-Test statistics multi-types:
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(equals(a, \'0\'), less(c, -90), greater(b, 900)) (removed)
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(equals(a, \'10000\'), equals(b, 0), less(c, 0)) (removed)
-Test LowCardinality and Nullable data type:
-tab2
diff --git a/tests/queries/0_stateless/02864_statistics_count_min_sketch.sql b/tests/queries/0_stateless/02864_statistics_count_min_sketch.sql
deleted file mode 100644
index c730aa7b4a7..00000000000
--- a/tests/queries/0_stateless/02864_statistics_count_min_sketch.sql
+++ /dev/null
@@ -1,70 +0,0 @@
--- Tags: no-fasttest
-
-DROP TABLE IF EXISTS tab SYNC;
-
-SET allow_experimental_statistics = 1;
-SET allow_statistics_optimize = 1;
-SET allow_suspicious_low_cardinality_types=1;
-SET mutations_sync = 2;
-
-CREATE TABLE tab
-(
-    a String,
-    b UInt64,
-    c Int64,
-    pk String,
-) Engine = MergeTree() ORDER BY pk
-SETTINGS min_bytes_for_wide_part = 0;
-
-SHOW CREATE TABLE tab;
-
-INSERT INTO tab select toString(number % 10000), number % 1000, -(number % 100), generateUUIDv4() FROM system.numbers LIMIT 10000;
-
-SELECT 'Test statistics count_min:';
-
-ALTER TABLE tab ADD STATISTICS a TYPE count_min;
-ALTER TABLE tab ADD STATISTICS b TYPE count_min;
-ALTER TABLE tab ADD STATISTICS c TYPE count_min;
-ALTER TABLE tab MATERIALIZE STATISTICS a, b, c;
-
-SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8|_UInt16|_String', '')
-FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE c = 0/*100*/ and b = 0/*10*/ and a = '0'/*1*/) xx
-WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-
-ALTER TABLE tab DROP STATISTICS a, b, c;
-
-
-SELECT 'Test statistics multi-types:';
-
-ALTER TABLE tab ADD STATISTICS a TYPE count_min;
-ALTER TABLE tab ADD STATISTICS b TYPE count_min, uniq, tdigest;
-ALTER TABLE tab ADD STATISTICS c TYPE count_min, uniq, tdigest;
-ALTER TABLE tab MATERIALIZE STATISTICS a, b, c;
-
-SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8|_UInt16|_String', '')
-FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE c < -90/*900*/ and b > 900/*990*/ and a = '0'/*1*/)
-WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-
-SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8|_UInt16|_String', '')
-FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE c < 0/*9900*/ and b = 0/*10*/ and a = '10000'/*0*/)
-WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-
-ALTER TABLE tab DROP STATISTICS a, b, c;
-
-DROP TABLE IF EXISTS tab SYNC;
-
-
-SELECT 'Test LowCardinality and Nullable data type:';
-DROP TABLE IF EXISTS tab2 SYNC;
-SET allow_suspicious_low_cardinality_types=1;
-CREATE TABLE tab2
-(
-    a LowCardinality(Int64) STATISTICS(count_min),
-    b Nullable(Int64) STATISTICS(count_min),
-    c LowCardinality(Nullable(Int64)) STATISTICS(count_min),
-    pk String,
-) Engine = MergeTree() ORDER BY pk;
-
-select name from system.tables where name = 'tab2' and database = currentDatabase();
-
-DROP TABLE IF EXISTS tab2 SYNC;
diff --git a/tests/queries/0_stateless/02864_statistics_ddl.reference b/tests/queries/0_stateless/02864_statistics_ddl.reference
index a7ff5caa0b0..0e453b0ee8a 100644
--- a/tests/queries/0_stateless/02864_statistics_ddl.reference
+++ b/tests/queries/0_stateless/02864_statistics_ddl.reference
@@ -1,31 +1,6 @@
-CREATE TABLE default.tab\n(\n    `a` Float64 STATISTICS(tdigest),\n    `b` Int64 STATISTICS(tdigest),\n    `pk` String\n)\nENGINE = MergeTree\nORDER BY pk\nSETTINGS min_bytes_for_wide_part = 0, index_granularity = 8192
-After insert
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(a, 10), less(b, 10)) (removed)
-10
-0
-After drop statistic
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(b, 10), less(a, 10)) (removed)
-10
-CREATE TABLE default.tab\n(\n    `a` Float64,\n    `b` Int64,\n    `pk` String\n)\nENGINE = MergeTree\nORDER BY pk\nSETTINGS min_bytes_for_wide_part = 0, index_granularity = 8192
-After add statistic
-CREATE TABLE default.tab\n(\n    `a` Float64 STATISTICS(tdigest),\n    `b` Int64 STATISTICS(tdigest),\n    `pk` String\n)\nENGINE = MergeTree\nORDER BY pk\nSETTINGS min_bytes_for_wide_part = 0, index_granularity = 8192
-After materialize statistic
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(a, 10), less(b, 10)) (removed)
-20
-After merge
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(a, 10), less(b, 10)) (removed)
-20
-CREATE TABLE default.tab\n(\n    `a` Float64 STATISTICS(tdigest),\n    `c` Int64 STATISTICS(tdigest),\n    `pk` String\n)\nENGINE = MergeTree\nORDER BY pk\nSETTINGS min_bytes_for_wide_part = 0, index_granularity = 8192
-After rename
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(a, 10), less(c, 10)) (removed)
-20
+CREATE TABLE default.tab\n(\n    `f64` Float64,\n    `f64_tdigest` Float64 STATISTICS(tdigest),\n    `f32` Float32,\n    `s` String,\n    `a` Array(Float64)\n)\nENGINE = MergeTree\nORDER BY tuple()\nSETTINGS index_granularity = 8192
+CREATE TABLE default.tab\n(\n    `f64` Float64 STATISTICS(tdigest, uniq),\n    `f64_tdigest` Float64 STATISTICS(tdigest),\n    `f32` Float32 STATISTICS(tdigest, uniq),\n    `s` String,\n    `a` Array(Float64)\n)\nENGINE = MergeTree\nORDER BY tuple()\nSETTINGS index_granularity = 8192
+CREATE TABLE default.tab\n(\n    `f64` Float64 STATISTICS(tdigest, uniq),\n    `f64_tdigest` Float64 STATISTICS(tdigest),\n    `f32` Float32 STATISTICS(tdigest, uniq),\n    `s` String,\n    `a` Array(Float64)\n)\nENGINE = MergeTree\nORDER BY tuple()\nSETTINGS index_granularity = 8192
+CREATE TABLE default.tab\n(\n    `f64` Float64 STATISTICS(tdigest, uniq),\n    `f64_tdigest` Float64 STATISTICS(tdigest),\n    `f32` Float32 STATISTICS(tdigest, uniq),\n    `s` String,\n    `a` Array(Float64)\n)\nENGINE = MergeTree\nORDER BY tuple()\nSETTINGS index_granularity = 8192
+CREATE TABLE default.tab\n(\n    `f64` Float64 STATISTICS(tdigest, uniq),\n    `f64_tdigest` Float64 STATISTICS(tdigest),\n    `f32` Float32 STATISTICS(tdigest, uniq),\n    `s` String,\n    `a` Array(Float64)\n)\nENGINE = MergeTree\nORDER BY tuple()\nSETTINGS index_granularity = 8192
+CREATE TABLE default.tab\n(\n    `f64` Float64,\n    `f64_tdigest` Float64 STATISTICS(tdigest),\n    `f32` Float32,\n    `s` String,\n    `a` Array(Float64)\n)\nENGINE = MergeTree\nORDER BY tuple()\nSETTINGS index_granularity = 8192
diff --git a/tests/queries/0_stateless/02864_statistics_ddl.sql b/tests/queries/0_stateless/02864_statistics_ddl.sql
index fe612efe2ac..32b56a842b7 100644
--- a/tests/queries/0_stateless/02864_statistics_ddl.sql
+++ b/tests/queries/0_stateless/02864_statistics_ddl.sql
@@ -1,59 +1,195 @@
--- Tests that various DDL statements create/drop/materialize statistics
+-- Tags: no-fasttest
+-- no-fasttest: 'count_min' sketches need a 3rd party library
+
+-- Tests DDL statements which create / drop / materialize statistics
+
+SET mutations_sync = 1;
 
 DROP TABLE IF EXISTS tab;
 
+-- Error case: Can't create statistics when allow_experimental_statistics = 0
+CREATE TABLE tab (col Float64 STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError INCORRECT_QUERY }
+
 SET allow_experimental_statistics = 1;
-SET allow_statistics_optimize = 1;
+
+-- Error case: Unknown statistics types are rejected
+CREATE TABLE tab (col Float64 STATISTICS(no_statistics_type)) Engine = MergeTree() ORDER BY tuple(); -- { serverError INCORRECT_QUERY }
+
+-- Error case: The same statistics type can't exist more than once on a column
+CREATE TABLE tab (col Float64 STATISTICS(tdigest, tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError INCORRECT_QUERY }
+
+SET allow_suspicious_low_cardinality_types = 1;
+
+-- Statistics can only be created on columns of specific data types (depending on the statistics kind), (*)
+
+--   tdigest requires data_type.isValueRepresentedByNumber
+--     These types work:
+CREATE TABLE tab (col UInt8 STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col UInt256 STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Float32 STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Decimal32(3) STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Date STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Date32 STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col DateTime STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col DateTime64 STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Enum('hello', 'world') STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col IPv4 STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Nullable(UInt8) STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col LowCardinality(UInt8) STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col LowCardinality(Nullable(UInt8)) STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+--     These types don't work:
+CREATE TABLE tab (col String STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+CREATE TABLE tab (col FixedString(1) STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+CREATE TABLE tab (col Array(Float64) STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+CREATE TABLE tab (col Tuple(Float64, Float64) STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+CREATE TABLE tab (col Map(UInt64, UInt64) STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+CREATE TABLE tab (col UUID STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+CREATE TABLE tab (col IPv6 STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+
+--   uniq requires data_type.isValueRepresentedByNumber
+--     These types work:
+CREATE TABLE tab (col UInt8 STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col UInt256 STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Float32 STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Decimal32(3) STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Date STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Date32 STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col DateTime STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col DateTime64 STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Enum('hello', 'world') STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col IPv4 STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Nullable(UInt8) STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col LowCardinality(UInt8) STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col LowCardinality(Nullable(UInt8)) STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+--     These types don't work:
+CREATE TABLE tab (col String STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+CREATE TABLE tab (col FixedString(1) STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+CREATE TABLE tab (col Array(Float64) STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+CREATE TABLE tab (col Tuple(Float64, Float64) STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+CREATE TABLE tab (col Map(UInt64, UInt64) STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+CREATE TABLE tab (col UUID STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+CREATE TABLE tab (col IPv6 STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+
+--   count_min requires data_type.isValueRepresentedByNumber or data_type = (Fixed)String
+--     These types work:
+CREATE TABLE tab (col UInt8 STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col UInt256 STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Float32 STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Decimal32(3) STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Date STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Date32 STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col DateTime STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col DateTime64 STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Enum('hello', 'world') STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col IPv4 STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col Nullable(UInt8) STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col LowCardinality(UInt8) STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col LowCardinality(Nullable(UInt8)) STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col String STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+CREATE TABLE tab (col FixedString(1) STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
+--     These types don't work:
+CREATE TABLE tab (col Array(Float64) STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+CREATE TABLE tab (col Tuple(Float64, Float64) STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+CREATE TABLE tab (col Map(UInt64, UInt64) STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+CREATE TABLE tab (col UUID STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+CREATE TABLE tab (col IPv6 STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+
+-- CREATE TABLE was easy, ALTER is more fun
 
 CREATE TABLE tab
 (
-    a Float64 STATISTICS(tdigest),
-    b Int64 STATISTICS(tdigest),
-    pk String,
-) Engine = MergeTree() ORDER BY pk
-SETTINGS min_bytes_for_wide_part = 0;
+    f64           Float64,
+    f64_tdigest   Float64 STATISTICS(tdigest),
+    f32           Float32,
+    s             String,
+    a             Array(Float64)
+)
+Engine = MergeTree()
+ORDER BY tuple();
 
+-- Error case: Unknown statistics types are rejected
+-- (relevant for ADD and MODIFY)
+ALTER TABLE tab ADD STATISTICS f64 TYPE no_statistics_type; -- { serverError INCORRECT_QUERY }
+ALTER TABLE tab ADD STATISTICS IF NOT EXISTS f64 TYPE no_statistics_type; -- { serverError INCORRECT_QUERY }
+ALTER TABLE tab MODIFY STATISTICS f64 TYPE no_statistics_type; -- { serverError INCORRECT_QUERY }
+-- for some reason, ALTER TABLE tab MODIFY STATISTICS IF EXISTS is not supported
+
+-- Error case: The same statistics type can't exist more than once on a column
+-- (relevant for ADD and MODIFY)
+--   Create the same statistics object twice
+ALTER TABLE tab ADD STATISTICS f64 TYPE tdigest, tdigest; -- { serverError INCORRECT_QUERY }
+ALTER TABLE tab ADD STATISTICS IF NOT EXISTS f64 TYPE tdigest, tdigest; -- { serverError INCORRECT_QUERY }
+ALTER TABLE tab MODIFY STATISTICS f64 TYPE tdigest, tdigest; -- { serverError INCORRECT_QUERY }
+--   Create a statistics object which already exists
+ALTER TABLE tab ADD STATISTICS f64_tdigest TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab ADD STATISTICS IF NOT EXISTS f64_tdigest TYPE tdigest; -- no-op
+ALTER TABLE tab MODIFY STATISTICS f64_tdigest TYPE tdigest; -- no-op
+
+-- Error case: Column does not exist
+-- (relevant for ADD, MODIFY, DROP, CLEAR, and MATERIALIZE)
+-- Note that the results are unfortunately quite inconsistent ...
+ALTER TABLE tab ADD STATISTICS no_such_column TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab ADD STATISTICS IF NOT EXISTS no_such_column TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab MODIFY STATISTICS no_such_column TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab DROP STATISTICS no_such_column; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab DROP STATISTICS IF EXISTS no_such_column; -- no-op
+ALTER TABLE tab CLEAR STATISTICS no_such_column; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab CLEAR STATISTICS IF EXISTS no_such_column; -- no-op
+ALTER TABLE tab MATERIALIZE STATISTICS no_such_column; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab MATERIALIZE STATISTICS IF EXISTS no_such_column; -- { serverError ILLEGAL_STATISTICS }
+
+-- Error case: Column exists but has no statistics
+-- (relevant for MODIFY, DROP, CLEAR, and MATERIALIZE)
+-- Note that the results are unfortunately quite inconsistent ...
+ALTER TABLE tab MODIFY STATISTICS s TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab DROP STATISTICS s; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab DROP STATISTICS IF EXISTS s; -- no-op
+ALTER TABLE tab CLEAR STATISTICS s; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab CLEAR STATISTICS IF EXISTS s; -- no-op
+ALTER TABLE tab MATERIALIZE STATISTICS s; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab MATERIALIZE STATISTICS IF EXISTS s; -- { serverError ILLEGAL_STATISTICS }
+
+-- We don't check systematically that statistics can only be created via ALTER ADD STATISTICS on columns of specific data types (the
+-- internal type validation code is tested already above, (*)). Only do a rudimentary check for each statistics type with a data type that
+-- works and one that doesn't work.
+--   tdigest
+--     Works:
+ALTER TABLE tab ADD STATISTICS f64 TYPE tdigest; ALTER TABLE tab DROP STATISTICS f64;
+ALTER TABLE tab MODIFY STATISTICS f64 TYPE tdigest; ALTER TABLE tab DROP STATISTICS f64;
+--     Doesn't work:
+ALTER TABLE tab ADD STATISTICS a TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab MODIFY STATISTICS a TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
+--   uniq
+--     Works:
+ALTER TABLE tab ADD STATISTICS f64 TYPE uniq; ALTER TABLE tab DROP STATISTICS f64;
+ALTER TABLE tab MODIFY STATISTICS f64 TYPE uniq; ALTER TABLE tab DROP STATISTICS f64;
+--     Doesn't work:
+ALTER TABLE tab ADD STATISTICS a TYPE uniq; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab MODIFY STATISTICS a TYPE uniq; -- { serverError ILLEGAL_STATISTICS }
+--   count_min
+--     Works:
+ALTER TABLE tab ADD STATISTICS f64 TYPE count_min; ALTER TABLE tab DROP STATISTICS f64;
+ALTER TABLE tab MODIFY STATISTICS f64 TYPE count_min; ALTER TABLE tab DROP STATISTICS f64;
+--     Doesn't work:
+ALTER TABLE tab ADD STATISTICS a TYPE count_min; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab MODIFY STATISTICS a TYPE count_min; -- { serverError ILLEGAL_STATISTICS }
+
+-- Any data type changes on columns with statistics are disallowed, for simplicity even if the new data type is compatible with all existing
+-- statistics objects (e.g. tdigest can be created on Float64 and UInt64)
+ALTER TABLE tab MODIFY COLUMN f64_tdigest UInt64; -- { serverError ALTER_OF_COLUMN_IS_FORBIDDEN }
+
+-- Finally, do a full-circle test of a good case. Print table definition after each step.
+-- Intentionally specifying _two_ columns and _two_ statistics types to have that also tested.
+SHOW CREATE TABLE tab;
+ALTER TABLE tab ADD STATISTICS f64, f32 TYPE tdigest, uniq;
+SHOW CREATE TABLE tab;
+ALTER TABLE tab MODIFY STATISTICS f64, f32 TYPE tdigest, uniq;
+SHOW CREATE TABLE tab;
+ALTER TABLE tab CLEAR STATISTICS f64, f32;
+SHOW CREATE TABLE tab;
+ALTER TABLE tab MATERIALIZE STATISTICS f64, f32;
+SHOW CREATE TABLE tab;
+ALTER TABLE tab DROP STATISTICS f64, f32;
 SHOW CREATE TABLE tab;
 
-INSERT INTO tab select number, -number, generateUUIDv4() FROM system.numbers LIMIT 10000;
-
-SELECT 'After insert';
-SELECT replaceRegexpAll(explain, '__table1\.|_UInt8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-SELECT count(*) FROM tab WHERE b < 10 and a < 10;
-SELECT count(*) FROM tab WHERE b < NULL and a < '10';
-
-ALTER TABLE tab DROP STATISTICS a, b;
-
-SELECT 'After drop statistic';
-SELECT replaceRegexpAll(explain, '__table1\.|_UInt8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-SELECT count(*) FROM tab WHERE b < 10 and a < 10;
-
-SHOW CREATE TABLE tab;
-
-ALTER TABLE tab ADD STATISTICS a, b TYPE tdigest;
-
-SELECT 'After add statistic';
-
-SHOW CREATE TABLE tab;
-
-ALTER TABLE tab MATERIALIZE STATISTICS a, b;
-INSERT INTO tab select number, -number, generateUUIDv4() FROM system.numbers LIMIT 10000;
-
-SELECT 'After materialize statistic';
-SELECT replaceRegexpAll(explain, '__table1\.|_UInt8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-SELECT count(*) FROM tab WHERE b < 10 and a < 10;
-
-OPTIMIZE TABLE tab FINAL;
-
-SELECT 'After merge';
-SELECT replaceRegexpAll(explain, '__table1\.|_UInt8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-SELECT count(*) FROM tab WHERE b < 10 and a < 10;
-
-ALTER TABLE tab RENAME COLUMN b TO c;
-SHOW CREATE TABLE tab;
-
-SELECT 'After rename';
-SELECT replaceRegexpAll(explain, '__table1\.|_UInt8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE c < 10 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-SELECT count(*) FROM tab WHERE c < 10 and a < 10;
-
-DROP TABLE IF EXISTS tab;
+DROP TABLE tab;
diff --git a/tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.reference b/tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.reference
new file mode 100644
index 00000000000..eb5e685597c
--- /dev/null
+++ b/tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.reference
@@ -0,0 +1,12 @@
+After insert
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(b, 10_UInt8), less(a, 10_UInt8)) (removed)
+After merge
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(a, 10_UInt8), less(b, 10_UInt8)) (removed)
+After truncate, insert, and materialize
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(a, 10_UInt8), less(b, 10_UInt8)) (removed)
diff --git a/tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.sql b/tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.sql
new file mode 100644
index 00000000000..33a5f9052ba
--- /dev/null
+++ b/tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.sql
@@ -0,0 +1,36 @@
+-- Tests delayed materialization of statistics in merge instead of during insert (setting 'materialize_statistics_on_insert = 0').
+-- (The concrete statistics type, column data type and predicate type don't matter)
+
+-- Checks by the predicate evaluation order in EXPLAIN. This is quite fragile, a better approach would be helpful (maybe 'send_logs_level'?)
+
+DROP TABLE IF EXISTS tab;
+
+SET allow_experimental_statistics = 1;
+SET allow_statistics_optimize = 1;
+SET allow_analyzer = 1;
+
+SET materialize_statistics_on_insert = 0;
+
+CREATE TABLE tab
+(
+    a Int64 STATISTICS(tdigest),
+    b Int16 STATISTICS(tdigest),
+) ENGINE = MergeTree() ORDER BY tuple()
+SETTINGS min_bytes_for_wide_part = 0, enable_vertical_merge_algorithm = 0; -- TODO: there is a bug in vertical merge with statistics.
+
+INSERT INTO tab SELECT number, -number FROM system.numbers LIMIT 10000;
+SELECT 'After insert';
+SELECT replaceRegexpAll(explain, '__table1\.', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%'; -- checks b first, then a (statistics not used)
+
+OPTIMIZE TABLE tab FINAL;
+SELECT 'After merge';
+SELECT replaceRegexpAll(explain, '__table1\.', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%'; -- checks a first, then b (statistics used)
+
+TRUNCATE TABLE tab;
+SET mutations_sync = 2;
+INSERT INTO tab SELECT number, -number FROM system.numbers LIMIT 10000;
+ALTER TABLE tab MATERIALIZE STATISTICS a, b;
+SELECT 'After truncate, insert, and materialize';
+SELECT replaceRegexpAll(explain, '__table1\.', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%'; -- checks a first, then b (statistics used)
+
+DROP TABLE tab;
diff --git a/tests/queries/0_stateless/02864_statistics_exception.reference b/tests/queries/0_stateless/02864_statistics_exception.reference
deleted file mode 100644
index e69de29bb2d..00000000000
diff --git a/tests/queries/0_stateless/02864_statistics_exception.sql b/tests/queries/0_stateless/02864_statistics_exception.sql
deleted file mode 100644
index 289ffee6600..00000000000
--- a/tests/queries/0_stateless/02864_statistics_exception.sql
+++ /dev/null
@@ -1,55 +0,0 @@
--- Tests creating/dropping/materializing statistics produces the right exceptions.
-
-DROP TABLE IF EXISTS tab;
-
--- Can't create statistics when allow_experimental_statistics = 0
-CREATE TABLE tab
-(
-    a Float64 STATISTICS(tdigest)
-) Engine = MergeTree() ORDER BY tuple(); -- { serverError INCORRECT_QUERY }
-
-SET allow_experimental_statistics = 1;
-
--- The same type of statistics can't exist more than once on a column
-CREATE TABLE tab
-(
-    a Float64 STATISTICS(tdigest, tdigest)
-) Engine = MergeTree() ORDER BY tuple(); -- { serverError INCORRECT_QUERY }
-
--- Unknown statistics types are rejected
-CREATE TABLE tab
-(
-    a Float64 STATISTICS(no_statistics_type)
-) Engine = MergeTree() ORDER BY tuple(); -- { serverError INCORRECT_QUERY }
-
--- tDigest statistics can only be created on numeric columns
-CREATE TABLE tab
-(
-    a String STATISTICS(tdigest),
-) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-
-CREATE TABLE tab
-(
-    a Float64,
-    b String
-) Engine = MergeTree() ORDER BY tuple();
-
-ALTER TABLE tab ADD STATISTICS a TYPE no_statistics_type; -- { serverError INCORRECT_QUERY }
-ALTER TABLE tab ADD STATISTICS a TYPE tdigest;
-ALTER TABLE tab ADD STATISTICS IF NOT EXISTS a TYPE tdigest;
-ALTER TABLE tab ADD STATISTICS a TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab MODIFY STATISTICS a TYPE tdigest;
--- Statistics can be created only on integer columns
-ALTER TABLE tab ADD STATISTICS b TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab DROP STATISTICS b; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab DROP STATISTICS a;
-ALTER TABLE tab DROP STATISTICS IF EXISTS a;
-ALTER TABLE tab CLEAR STATISTICS a; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab CLEAR STATISTICS IF EXISTS a;
-ALTER TABLE tab MATERIALIZE STATISTICS b; -- { serverError ILLEGAL_STATISTICS }
-
-ALTER TABLE tab ADD STATISTICS a TYPE tdigest;
-ALTER TABLE tab MODIFY COLUMN a Float64 TTL toDateTime(b) + INTERVAL 1 MONTH;
-ALTER TABLE tab MODIFY COLUMN a Int64; -- { serverError ALTER_OF_COLUMN_IS_FORBIDDEN }
-
-DROP TABLE tab;
diff --git a/tests/queries/0_stateless/02864_statistics_materialize_in_merge.reference b/tests/queries/0_stateless/02864_statistics_materialize_in_merge.reference
deleted file mode 100644
index 5e969cf41cb..00000000000
--- a/tests/queries/0_stateless/02864_statistics_materialize_in_merge.reference
+++ /dev/null
@@ -1,10 +0,0 @@
-10
-10
-10
-statistics not used	Condition less(b, 10_UInt8) moved to PREWHERE
-statistics not used	Condition less(a, 10_UInt8) moved to PREWHERE
-statistics used after merge	Condition less(a, 10_UInt8) moved to PREWHERE
-statistics used after merge	Condition less(b, 10_UInt8) moved to PREWHERE
-statistics used after materialize	Condition less(a, 10_UInt8) moved to PREWHERE
-statistics used after materialize	Condition less(b, 10_UInt8) moved to PREWHERE
-2	0
diff --git a/tests/queries/0_stateless/02864_statistics_materialize_in_merge.sql b/tests/queries/0_stateless/02864_statistics_materialize_in_merge.sql
deleted file mode 100644
index 6606cff263f..00000000000
--- a/tests/queries/0_stateless/02864_statistics_materialize_in_merge.sql
+++ /dev/null
@@ -1,52 +0,0 @@
--- Tests delayed materialization of statistics in merge instead of during insert (setting 'materialize_statistics_on_insert = 0').
-
-DROP TABLE IF EXISTS tab;
-
-SET enable_analyzer = 1;
-SET allow_experimental_statistics = 1;
-SET allow_statistics_optimize = 1;
-
-SET materialize_statistics_on_insert = 0;
-
-CREATE TABLE tab
-(
-    a Int64 STATISTICS(tdigest),
-    b Int16 STATISTICS(tdigest),
-) ENGINE = MergeTree() ORDER BY tuple()
-SETTINGS min_bytes_for_wide_part = 0, enable_vertical_merge_algorithm = 0; -- TODO: there is a bug in vertical merge with statistics.
-
-INSERT INTO tab SELECT number, -number FROM system.numbers LIMIT 10000;
-
-SELECT count(*) FROM tab WHERE b < 10 and a < 10 SETTINGS log_comment = 'statistics not used';
-
-OPTIMIZE TABLE tab FINAL;
-
-SELECT count(*) FROM tab WHERE b < 10 and a < 10 SETTINGS log_comment = 'statistics used after merge';
-
-TRUNCATE TABLE tab;
-SET mutations_sync = 2;
-
-INSERT INTO tab SELECT number, -number FROM system.numbers LIMIT 10000;
-ALTER TABLE tab MATERIALIZE STATISTICS a, b;
-
-SELECT count(*) FROM tab WHERE b < 10 and a < 10 SETTINGS log_comment = 'statistics used after materialize';
-
-DROP TABLE tab;
-
-SYSTEM FLUSH LOGS;
-
-SELECT log_comment, message FROM system.text_log JOIN
-(
-    SELECT Settings['log_comment'] AS log_comment, query_id FROM system.query_log
-    WHERE current_database = currentDatabase()
-        AND query LIKE 'SELECT count(*) FROM tab%'
-        AND type = 'QueryFinish'
-) AS query_log USING (query_id)
-WHERE message LIKE '%moved to PREWHERE%'
-ORDER BY event_time_microseconds;
-
-SELECT count(), sum(ProfileEvents['MergeTreeDataWriterStatisticsCalculationMicroseconds'])
-FROM system.query_log
-WHERE current_database = currentDatabase()
-    AND query LIKE 'INSERT INTO tab SELECT%'
-    AND type = 'QueryFinish';
diff --git a/tests/queries/0_stateless/02864_statistics_predicates.reference b/tests/queries/0_stateless/02864_statistics_predicates.reference
new file mode 100644
index 00000000000..1c2abd47aaf
--- /dev/null
+++ b/tests/queries/0_stateless/02864_statistics_predicates.reference
@@ -0,0 +1,92 @@
+u64 and =
+10
+10
+10
+10
+0
+0
+0
+0
+10
+10
+10
+10
+u64 and <
+70
+70
+70
+70
+80
+80
+80
+80
+70
+70
+70
+f64 and =
+10
+10
+10
+10
+0
+0
+0
+0
+10
+10
+10
+0
+0
+0
+f64 and <
+70
+70
+70
+70
+80
+80
+80
+80
+70
+70
+70
+80
+80
+80
+dt and =
+0
+0
+0
+0
+10
+10
+10
+10
+dt and <
+10000
+10000
+10000
+70
+70
+70
+70
+b and =
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+5000
+0
+0
+0
+0
+s and =
+10
+10
diff --git a/tests/queries/0_stateless/02864_statistics_predicates.sql b/tests/queries/0_stateless/02864_statistics_predicates.sql
new file mode 100644
index 00000000000..3e754dfb1de
--- /dev/null
+++ b/tests/queries/0_stateless/02864_statistics_predicates.sql
@@ -0,0 +1,214 @@
+-- Tags: no-fasttest
+-- no-fasttest: 'count_min' sketches need a 3rd party library
+
+-- Tests the cross product of all predicates with all right-hand sides on all data types and all statistics types.
+
+SET allow_experimental_statistics = 1;
+SET allow_statistics_optimize = 1;
+
+DROP TABLE IF EXISTS tab;
+
+CREATE TABLE tab
+(
+    u64                 UInt64,
+    u64_tdigest         UInt64 STATISTICS(tdigest),
+    u64_count_min       UInt64 STATISTICS(count_min),
+    u64_uniq            UInt64 STATISTICS(uniq),
+    f64                 Float64,
+    f64_tdigest         Float64 STATISTICS(tdigest),
+    f64_count_min       Float64 STATISTICS(count_min),
+    f64_uniq            Float64 STATISTICS(uniq),
+    dt                  DateTime,
+    dt_tdigest          DateTime STATISTICS(tdigest),
+    dt_count_min        DateTime STATISTICS(count_min),
+    dt_uniq             DateTime STATISTICS(uniq),
+    b                   Bool,
+    b_tdigest           Bool STATISTICS(tdigest),
+    b_count_min         Bool STATISTICS(count_min),
+    b_uniq              Bool STATISTICS(uniq),
+    s                   String,
+ -- s_tdigest           String STATISTICS(tdigest), -- not supported by tdigest
+    s_count_min         String STATISTICS(count_min)
+ -- s_uniq              String STATISTICS(uniq), -- not supported by uniq
+) Engine = MergeTree() ORDER BY tuple()
+SETTINGS min_bytes_for_wide_part = 0;
+
+INSERT INTO tab
+-- SELECT number % 10000, number % 1000, -(number % 100) FROM system.numbers LIMIT 10000;
+SELECT number % 1000,
+       number % 1000,
+       number % 1000,
+       number % 1000,
+       number % 1000,
+       number % 1000,
+       number % 1000,
+       number % 1000,
+       number % 1000,
+       number % 1000,
+       number % 1000,
+       number % 1000,
+       number % 2,
+       number % 2,
+       number % 2,
+       number % 2,
+       toString(number % 1000),
+       toString(number % 1000)
+FROM system.numbers LIMIT 10000;
+
+-- u64 ----------------------------------------------------
+
+SELECT 'u64 and =';
+
+SELECT count(*) FROM tab WHERE u64 = 7;
+SELECT count(*) FROM tab WHERE u64_tdigest = 7;
+SELECT count(*) FROM tab WHERE u64_count_min = 7;
+SELECT count(*) FROM tab WHERE u64_uniq = 7;
+
+SELECT count(*) FROM tab WHERE u64 = 7.7;
+SELECT count(*) FROM tab WHERE u64_tdigest = 7.7;
+SELECT count(*) FROM tab WHERE u64_count_min = 7.7;
+SELECT count(*) FROM tab WHERE u64_uniq = 7.7;
+
+SELECT count(*) FROM tab WHERE u64 = '7';
+SELECT count(*) FROM tab WHERE u64_tdigest = '7';
+SELECT count(*) FROM tab WHERE u64_count_min = '7';
+SELECT count(*) FROM tab WHERE u64_uniq = '7';
+
+SELECT count(*) FROM tab WHERE u64 = '7.7'; -- { serverError TYPE_MISMATCH }
+SELECT count(*) FROM tab WHERE u64_tdigest = '7.7'; -- { serverError TYPE_MISMATCH }
+SELECT count(*) FROM tab WHERE u64_count_min = '7.7'; -- { serverError TYPE_MISMATCH }
+SELECT count(*) FROM tab WHERE u64_uniq = '7.7'; -- { serverError TYPE_MISMATCH }
+
+SELECT 'u64 and <';
+
+SELECT count(*) FROM tab WHERE u64 < 7;
+SELECT count(*) FROM tab WHERE u64_tdigest < 7;
+SELECT count(*) FROM tab WHERE u64_count_min < 7;
+SELECT count(*) FROM tab WHERE u64_uniq < 7;
+
+SELECT count(*) FROM tab WHERE u64 < 7.7;
+SELECT count(*) FROM tab WHERE u64_tdigest < 7.7;
+SELECT count(*) FROM tab WHERE u64_count_min < 7.7;
+SELECT count(*) FROM tab WHERE u64_uniq < 7.7;
+
+SELECT count(*) FROM tab WHERE u64 < '7';
+-- SELECT count(*) FROM tab WHERE u64_tdigest < '7'; -- BOOM (#67742)
+SELECT count(*) FROM tab WHERE u64_count_min < '7';
+SELECT count(*) FROM tab WHERE u64_uniq < '7';
+
+SELECT count(*) FROM tab WHERE u64 < '7.7'; -- { serverError TYPE_MISMATCH }
+SELECT count(*) FROM tab WHERE u64_tdigest < '7.7'; -- { serverError TYPE_MISMATCH }
+SELECT count(*) FROM tab WHERE u64_count_min < '7.7'; -- { serverError TYPE_MISMATCH }
+SELECT count(*) FROM tab WHERE u64_uniq < '7.7'; -- { serverError TYPE_MISMATCH }
+
+-- f64 ----------------------------------------------------
+
+SELECT 'f64 and =';
+
+SELECT count(*) FROM tab WHERE f64 = 7;
+SELECT count(*) FROM tab WHERE f64_tdigest = 7;
+SELECT count(*) FROM tab WHERE f64_count_min = 7;
+SELECT count(*) FROM tab WHERE f64_uniq = 7;
+
+SELECT count(*) FROM tab WHERE f64 = 7.7;
+SELECT count(*) FROM tab WHERE f64_tdigest = 7.7;
+SELECT count(*) FROM tab WHERE f64_count_min = 7.7;
+SELECT count(*) FROM tab WHERE f64_uniq = 7.7;
+
+SELECT count(*) FROM tab WHERE f64 = '7';
+-- SELECT count(*) FROM tab WHERE f64_tdigest = '7'; -- BOOM (#67742)
+SELECT count(*) FROM tab WHERE f64_count_min = '7';
+SELECT count(*) FROM tab WHERE f64_uniq = '7';
+
+SELECT count(*) FROM tab WHERE f64 = '7.7';
+-- SELECT count(*) FROM tab WHERE f64_tdigest = '7.7'; -- BOOM (#67742)
+SELECT count(*) FROM tab WHERE f64_count_min = '7.7';
+SELECT count(*) FROM tab WHERE f64_uniq = '7.7';
+
+SELECT 'f64 and <';
+
+SELECT count(*) FROM tab WHERE f64 < 7;
+SELECT count(*) FROM tab WHERE f64_tdigest < 7;
+SELECT count(*) FROM tab WHERE f64_count_min < 7;
+SELECT count(*) FROM tab WHERE f64_uniq < 7;
+
+SELECT count(*) FROM tab WHERE f64 < 7.7;
+SELECT count(*) FROM tab WHERE f64_tdigest < 7.7;
+SELECT count(*) FROM tab WHERE f64_count_min < 7.7;
+SELECT count(*) FROM tab WHERE f64_uniq < 7.7;
+
+SELECT count(*) FROM tab WHERE f64 < '7';
+-- SELECT count(*) FROM tab WHERE f64_tdigest < '7'; -- BOOM (#67742)
+SELECT count(*) FROM tab WHERE f64_count_min < '7';
+SELECT count(*) FROM tab WHERE f64_uniq < '7';
+
+SELECT count(*) FROM tab WHERE f64 < '7.7';
+-- SELECT count(*) FROM tab WHERE f64_tdigest < '7.7'; -- BOOM (#67742)
+SELECT count(*) FROM tab WHERE f64_count_min < '7.7';
+SELECT count(*) FROM tab WHERE f64_uniq < '7.7';
+
+-- dt ----------------------------------------------------
+
+SELECT 'dt and =';
+
+SELECT count(*) FROM tab WHERE dt = '2024-08-08 11:12:13';
+SELECT count(*) FROM tab WHERE dt_tdigest = '2024-08-08 11:12:13';
+SELECT count(*) FROM tab WHERE dt_count_min = '2024-08-08 11:12:13';
+SELECT count(*) FROM tab WHERE dt_uniq = '2024-08-08 11:12:13';
+
+SELECT count(*) FROM tab WHERE dt = 7;
+SELECT count(*) FROM tab WHERE dt_tdigest = 7;
+SELECT count(*) FROM tab WHERE dt_count_min = 7;
+SELECT count(*) FROM tab WHERE dt_uniq = 7;
+
+SELECT 'dt and <';
+
+SELECT count(*) FROM tab WHERE dt < '2024-08-08 11:12:13';
+-- SELECT count(*) FROM tab WHERE dt_tdigest < '2024-08-08 11:12:13'; -- BOOM (#67742)
+SELECT count(*) FROM tab WHERE dt_count_min < '2024-08-08 11:12:13';
+SELECT count(*) FROM tab WHERE dt_uniq < '2024-08-08 11:12:13';
+
+SELECT count(*) FROM tab WHERE dt < 7;
+SELECT count(*) FROM tab WHERE dt_tdigest < 7;
+SELECT count(*) FROM tab WHERE dt_count_min < 7;
+SELECT count(*) FROM tab WHERE dt_uniq < 7;
+
+-- b ----------------------------------------------------
+
+SELECT 'b and =';
+
+SELECT count(*) FROM tab WHERE b = true;
+SELECT count(*) FROM tab WHERE b_tdigest = true;
+SELECT count(*) FROM tab WHERE b_count_min = true;
+SELECT count(*) FROM tab WHERE b_uniq = true;
+
+SELECT count(*) FROM tab WHERE b = 'true';
+SELECT count(*) FROM tab WHERE b_tdigest = 'true';
+SELECT count(*) FROM tab WHERE b_count_min = 'true';
+SELECT count(*) FROM tab WHERE b_uniq = 'true';
+
+SELECT count(*) FROM tab WHERE b = 1;
+SELECT count(*) FROM tab WHERE b_tdigest = 1;
+SELECT count(*) FROM tab WHERE b_count_min = 1;
+SELECT count(*) FROM tab WHERE b_uniq = 1;
+
+SELECT count(*) FROM tab WHERE b = 1.1;
+SELECT count(*) FROM tab WHERE b_tdigest = 1.1;
+SELECT count(*) FROM tab WHERE b_count_min = 1.1;
+SELECT count(*) FROM tab WHERE b_uniq = 1.1;
+
+-- s ----------------------------------------------------
+
+SELECT 's and =';
+
+SELECT count(*) FROM tab WHERE s = 7; -- { serverError NO_COMMON_TYPE }
+-- SELECT count(*) FROM tab WHERE s_tdigest = 7; -- not supported
+SELECT count(*) FROM tab WHERE s_count_min = 7; -- { serverError NO_COMMON_TYPE }
+-- SELECT count(*) FROM tab WHERE s_uniq = 7; -- not supported
+
+SELECT count(*) FROM tab WHERE s = '7';
+-- SELECT count(*) FROM tab WHERE s_tdigest = '7'; -- not supported
+SELECT count(*) FROM tab WHERE s_count_min = '7';
+-- SELECT count(*) FROM tab WHERE s_uniq = '7'; -- not supported
+
+DROP TABLE tab;
diff --git a/tests/queries/0_stateless/02864_statistics_uniq.reference b/tests/queries/0_stateless/02864_statistics_uniq.reference
deleted file mode 100644
index 77786dbdd8c..00000000000
--- a/tests/queries/0_stateless/02864_statistics_uniq.reference
+++ /dev/null
@@ -1,35 +0,0 @@
-CREATE TABLE default.t1\n(\n    `a` Float64 STATISTICS(tdigest),\n    `b` Int64 STATISTICS(tdigest),\n    `c` Int64 STATISTICS(tdigest, uniq),\n    `pk` String\n)\nENGINE = MergeTree\nORDER BY pk\nSETTINGS min_bytes_for_wide_part = 0, index_granularity = 8192
-After insert
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(a, 10), equals(c, 0), less(b, 10)) (removed)
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(equals(c, 11), less(a, 10), less(b, 10)) (removed)
-After merge
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(a, 10), equals(c, 0), less(b, 10)) (removed)
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(equals(c, 11), less(a, 10), less(b, 10)) (removed)
-After modify TDigest
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(a, 10), equals(c, 11), less(b, 10)) (removed)
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(a, 10), equals(c, 0), less(b, 10)) (removed)
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(c, -1), less(a, 10), less(b, 10)) (removed)
-After drop
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(a, 10), equals(c, 11), less(b, 10)) (removed)
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(a, 10), equals(c, 0), less(b, 10)) (removed)
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(a, 10), less(c, -1), less(b, 10)) (removed)
diff --git a/tests/queries/0_stateless/02864_statistics_uniq.sql b/tests/queries/0_stateless/02864_statistics_uniq.sql
deleted file mode 100644
index 0f5f353c045..00000000000
--- a/tests/queries/0_stateless/02864_statistics_uniq.sql
+++ /dev/null
@@ -1,73 +0,0 @@
-DROP TABLE IF EXISTS t1;
-
-SET allow_experimental_statistics = 1;
-SET allow_statistics_optimize = 1;
-SET mutations_sync = 1;
-
-CREATE TABLE t1
-(
-    a Float64 STATISTICS(tdigest),
-    b Int64 STATISTICS(tdigest),
-    c Int64 STATISTICS(tdigest, uniq),
-    pk String,
-) Engine = MergeTree() ORDER BY pk
-SETTINGS min_bytes_for_wide_part = 0;
-
-SHOW CREATE TABLE t1;
-
-INSERT INTO t1 select number, -number, number/1000, generateUUIDv4() FROM system.numbers LIMIT 10000;
-INSERT INTO t1 select 0, 0, 11, generateUUIDv4();
-
-SELECT 'After insert';
-SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c = 0 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c = 11 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-OPTIMIZE TABLE t1 FINAL;
-
-SELECT 'After merge';
-SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c = 0 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c = 11 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-
-SELECT 'After modify TDigest';
-ALTER TABLE t1 MODIFY STATISTICS c TYPE TDigest;
-ALTER TABLE t1 MATERIALIZE STATISTICS c;
-
-SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c = 11 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c = 0 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c < -1 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-
-
-ALTER TABLE t1 DROP STATISTICS c;
-
-SELECT 'After drop';
-SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c = 11 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c = 0 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c < -1 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
-
-DROP TABLE IF EXISTS t1;
-DROP TABLE IF EXISTS t2;
-SET allow_suspicious_low_cardinality_types=1;
-CREATE TABLE t2
-(
-    a Float64 STATISTICS(tdigest),
-    b Int64 STATISTICS(tdigest),
-    c LowCardinality(Int64) STATISTICS(tdigest, uniq),
-    pk String,
-) Engine = MergeTree() ORDER BY pk
-SETTINGS min_bytes_for_wide_part = 0;
-INSERT INTO t2 select number, -number, number/1000, generateUUIDv4() FROM system.numbers LIMIT 10000;
-
-DROP TABLE IF EXISTS t2;
-DROP TABLE IF EXISTS t3;
-
-CREATE TABLE t3
-(
-    a Float64 STATISTICS(tdigest),
-    b Int64 STATISTICS(tdigest),
-    c Nullable(Int64) STATISTICS(tdigest, uniq),
-    pk String,
-) Engine = MergeTree() ORDER BY pk
-SETTINGS min_bytes_for_wide_part = 0;
-INSERT INTO t3 select number, -number, number/1000, generateUUIDv4() FROM system.numbers LIMIT 10000;
-
-DROP TABLE IF EXISTS t3;
-
diff --git a/tests/queries/0_stateless/02864_statistics_usage.reference b/tests/queries/0_stateless/02864_statistics_usage.reference
new file mode 100644
index 00000000000..a9f669b88c1
--- /dev/null
+++ b/tests/queries/0_stateless/02864_statistics_usage.reference
@@ -0,0 +1,20 @@
+After insert
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(a, 10_UInt8), less(b, 10_UInt8)) (removed)
+After drop statistic
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(b, 10_UInt8), less(a, 10_UInt8)) (removed)
+After add and materialize statistic
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(a, 10_UInt8), less(b, 10_UInt8)) (removed)
+After merge
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(a, 10_UInt8), less(b, 10_UInt8)) (removed)
+After rename
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(a, 10_UInt8), less(c, 10_UInt8)) (removed)
diff --git a/tests/queries/0_stateless/02864_statistics_usage.sql b/tests/queries/0_stateless/02864_statistics_usage.sql
new file mode 100644
index 00000000000..f936854df44
--- /dev/null
+++ b/tests/queries/0_stateless/02864_statistics_usage.sql
@@ -0,0 +1,42 @@
+-- Test that the optimizer picks up column statistics
+-- (The concrete statistics type, column data type and predicate type don't matter)
+
+-- Verifies statistics usage via the predicate evaluation order shown in EXPLAIN. This is quite fragile; a better approach would be helpful (maybe 'send_logs_level'?)
+
+SET allow_experimental_statistics = 1;
+SET allow_statistics_optimize = 1;
+SET mutations_sync = 1;
+SET allow_analyzer = 1;
+
+DROP TABLE IF EXISTS tab;
+
+CREATE TABLE tab
+(
+    a Float64 STATISTICS(tdigest),
+    b Int64 STATISTICS(tdigest)
+) Engine = MergeTree() ORDER BY tuple()
+SETTINGS min_bytes_for_wide_part = 0;
+
+INSERT INTO tab select number, -number FROM system.numbers LIMIT 10000;
+SELECT 'After insert';
+SELECT replaceRegexpAll(explain, '__table1\.', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%'; -- checks a first, then b (statistics used)
+
+ALTER TABLE tab DROP STATISTICS a, b;
+SELECT 'After drop statistic';
+SELECT replaceRegexpAll(explain, '__table1\.', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%'; -- checks b first, then a (statistics not used)
+
+ALTER TABLE tab ADD STATISTICS a, b TYPE tdigest;
+ALTER TABLE tab MATERIALIZE STATISTICS a, b;
+INSERT INTO tab select number, -number FROM system.numbers LIMIT 10000;
+SELECT 'After add and materialize statistic';
+SELECT replaceRegexpAll(explain, '__table1\.', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%'; -- checks a first, then b (statistics used)
+
+OPTIMIZE TABLE tab FINAL;
+SELECT 'After merge';
+SELECT replaceRegexpAll(explain, '__table1\.', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%'; -- checks a first, then b (statistics used)
+
+ALTER TABLE tab RENAME COLUMN b TO c;
+SELECT 'After rename';
+SELECT replaceRegexpAll(explain, '__table1\.', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE c < 10 and a < 10) WHERE explain LIKE '%Prewhere%'; -- checks a first, then c (statistics used)
+
+DROP TABLE IF EXISTS tab;

From 55b2000d38e0bc6282714fdb1204d450437433ec Mon Sep 17 00:00:00 2001
From: Robert Schulze <robert@clickhouse.com>
Date: Thu, 8 Aug 2024 13:58:43 +0000
Subject: [PATCH 26/52] Fix fasttest

---
 .../02864_statistics_delayed_materialization_in_merge.sql       | 2 +-
 tests/queries/0_stateless/02864_statistics_usage.sql            | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.sql b/tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.sql
index 33a5f9052ba..d469a4c2036 100644
--- a/tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.sql
+++ b/tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.sql
@@ -7,7 +7,7 @@ DROP TABLE IF EXISTS tab;
 
 SET allow_experimental_statistics = 1;
 SET allow_statistics_optimize = 1;
-SET allow_analyzer = 1;
+SET enable_analyzer = 1;
 
 SET materialize_statistics_on_insert = 0;
 
diff --git a/tests/queries/0_stateless/02864_statistics_usage.sql b/tests/queries/0_stateless/02864_statistics_usage.sql
index f936854df44..4956bd27e87 100644
--- a/tests/queries/0_stateless/02864_statistics_usage.sql
+++ b/tests/queries/0_stateless/02864_statistics_usage.sql
@@ -6,7 +6,7 @@
 SET allow_experimental_statistics = 1;
 SET allow_statistics_optimize = 1;
 SET mutations_sync = 1;
-SET allow_analyzer = 1;
+SET enable_analyzer = 1;
 
 DROP TABLE IF EXISTS tab;
 

From 33ba78ee42bc85690dce69c82fd51d723a6d2eab Mon Sep 17 00:00:00 2001
From: Alexander Tokmakov <tavplubix@clickhouse.com>
Date: Thu, 8 Aug 2024 17:47:12 +0200
Subject: [PATCH 27/52] Update test.py

---
 tests/integration/test_drop_is_lock_free/test.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/integration/test_drop_is_lock_free/test.py b/tests/integration/test_drop_is_lock_free/test.py
index 1bb8767a9a0..3855bc21f90 100644
--- a/tests/integration/test_drop_is_lock_free/test.py
+++ b/tests/integration/test_drop_is_lock_free/test.py
@@ -176,7 +176,7 @@ def test_query_is_permanent(transaction, permanent, exclusive_table):
 
     select_handler = node.get_query_request(
         f"""
-            SELECT sleepEachRow(3) FROM {exclusive_table} SETTINGS function_sleep_max_microseconds_per_block = 0;
+            SELECT sleepEachRow(3) FROM {exclusive_table} SETTINGS function_sleep_max_microseconds_per_block = 0, max_threads=1;
         """,
         query_id=query_id,
     )

From f9f13a8e415e9f2130281d069c28dd6e9a68be75 Mon Sep 17 00:00:00 2001
From: Anton Popov <anton@clickhouse.com>
Date: Thu, 8 Aug 2024 16:27:25 +0000
Subject: [PATCH 28/52] enable setting optimize_functions_to_subcolumns by
 default

---
 src/Core/Settings.h                 | 2 +-
 src/Core/SettingsChangesHistory.cpp | 1 +
 2 files changed, 2 insertions(+), 1 deletion(-)

diff --git a/src/Core/Settings.h b/src/Core/Settings.h
index f04c696645a..f0a8d0c2647 100644
--- a/src/Core/Settings.h
+++ b/src/Core/Settings.h
@@ -605,7 +605,7 @@ class IColumn;
     M(Bool, optimize_if_chain_to_multiif, false, "Replace if(cond1, then1, if(cond2, ...)) chains to multiIf. Currently it's not beneficial for numeric types.", 0) \
     M(Bool, optimize_multiif_to_if, true, "Replace 'multiIf' with only one condition to 'if'.", 0) \
     M(Bool, optimize_if_transform_strings_to_enum, false, "Replaces string-type arguments in If and Transform to enum. Disabled by default cause it could make inconsistent change in distributed query that would lead to its fail.", 0) \
-    M(Bool, optimize_functions_to_subcolumns, false, "Transform functions to subcolumns, if possible, to reduce amount of read data. E.g. 'length(arr)' -> 'arr.size0', 'col IS NULL' -> 'col.null' ", 0) \
+    M(Bool, optimize_functions_to_subcolumns, true, "Transform functions to subcolumns, if possible, to reduce amount of read data. E.g. 'length(arr)' -> 'arr.size0', 'col IS NULL' -> 'col.null' ", 0) \
     M(Bool, optimize_using_constraints, false, "Use constraints for query optimization", 0)                                                                                                                                           \
     M(Bool, optimize_substitute_columns, false, "Use constraints for column substitution", 0)                                                                                                                                         \
     M(Bool, optimize_append_index, false, "Use constraints in order to append index condition (indexHint)", 0) \
diff --git a/src/Core/SettingsChangesHistory.cpp b/src/Core/SettingsChangesHistory.cpp
index 41e4ac2e154..b00d0964e01 100644
--- a/src/Core/SettingsChangesHistory.cpp
+++ b/src/Core/SettingsChangesHistory.cpp
@@ -83,6 +83,7 @@ static std::initializer_list<std::pair<ClickHouseVersion, SettingsChangesHistory
             {"allow_archive_path_syntax", true, true, "Added new setting to allow disabling archive path syntax."},
             {"allow_experimental_time_series_table", false, false, "Added new setting to allow the TimeSeries table engine"},
             {"enable_analyzer", 1, 1, "Added an alias to a setting `allow_experimental_analyzer`."},
+            {"optimize_functions_to_subcolumns", false, true, "Enabled settings by default"},
         }
     },
     {"24.7",

From b0b150c599052d596b8c746a31ba50019601b6a0 Mon Sep 17 00:00:00 2001
From: Robert Schulze <robert@clickhouse.com>
Date: Thu, 8 Aug 2024 18:29:20 +0000
Subject: [PATCH 29/52] Remove workarounds for solved bugs

---
 .../02864_statistics_predicates.reference            |  6 ++++++
 .../0_stateless/02864_statistics_predicates.sql      | 12 ++++++------
 2 files changed, 12 insertions(+), 6 deletions(-)

diff --git a/tests/queries/0_stateless/02864_statistics_predicates.reference b/tests/queries/0_stateless/02864_statistics_predicates.reference
index 1c2abd47aaf..ffbd7269e05 100644
--- a/tests/queries/0_stateless/02864_statistics_predicates.reference
+++ b/tests/queries/0_stateless/02864_statistics_predicates.reference
@@ -23,6 +23,7 @@ u64 and <
 70
 70
 70
+70
 f64 and =
 10
 10
@@ -35,6 +36,8 @@ f64 and =
 10
 10
 10
+10
+0
 0
 0
 0
@@ -50,6 +53,8 @@ f64 and <
 70
 70
 70
+70
+80
 80
 80
 80
@@ -66,6 +71,7 @@ dt and <
 10000
 10000
 10000
+10000
 70
 70
 70
diff --git a/tests/queries/0_stateless/02864_statistics_predicates.sql b/tests/queries/0_stateless/02864_statistics_predicates.sql
index 3e754dfb1de..779116cf19a 100644
--- a/tests/queries/0_stateless/02864_statistics_predicates.sql
+++ b/tests/queries/0_stateless/02864_statistics_predicates.sql
@@ -92,7 +92,7 @@ SELECT count(*) FROM tab WHERE u64_count_min < 7.7;
 SELECT count(*) FROM tab WHERE u64_uniq < 7.7;
 
 SELECT count(*) FROM tab WHERE u64 < '7';
--- SELECT count(*) FROM tab WHERE u64_tdigest < '7'; -- BOOM (#67742)
+SELECT count(*) FROM tab WHERE u64_tdigest < '7';
 SELECT count(*) FROM tab WHERE u64_count_min < '7';
 SELECT count(*) FROM tab WHERE u64_uniq < '7';
 
@@ -116,12 +116,12 @@ SELECT count(*) FROM tab WHERE f64_count_min = 7.7;
 SELECT count(*) FROM tab WHERE f64_uniq = 7.7;
 
 SELECT count(*) FROM tab WHERE f64 = '7';
--- SELECT count(*) FROM tab WHERE f64_tdigest = '7'; -- BOOM (#67742)
+SELECT count(*) FROM tab WHERE f64_tdigest = '7';
 SELECT count(*) FROM tab WHERE f64_count_min = '7';
 SELECT count(*) FROM tab WHERE f64_uniq = '7';
 
 SELECT count(*) FROM tab WHERE f64 = '7.7';
--- SELECT count(*) FROM tab WHERE f64_tdigest = '7.7'; -- BOOM (#67742)
+SELECT count(*) FROM tab WHERE f64_tdigest = '7.7';
 SELECT count(*) FROM tab WHERE f64_count_min = '7.7';
 SELECT count(*) FROM tab WHERE f64_uniq = '7.7';
 
@@ -138,12 +138,12 @@ SELECT count(*) FROM tab WHERE f64_count_min < 7.7;
 SELECT count(*) FROM tab WHERE f64_uniq < 7.7;
 
 SELECT count(*) FROM tab WHERE f64 < '7';
--- SELECT count(*) FROM tab WHERE f64_tdigest < '7'; -- BOOM (#67742)
+SELECT count(*) FROM tab WHERE f64_tdigest < '7';
 SELECT count(*) FROM tab WHERE f64_count_min < '7';
 SELECT count(*) FROM tab WHERE f64_uniq < '7';
 
 SELECT count(*) FROM tab WHERE f64 < '7.7';
--- SELECT count(*) FROM tab WHERE f64_tdigest < '7.7'; -- BOOM (#67742)
+SELECT count(*) FROM tab WHERE f64_tdigest < '7.7';
 SELECT count(*) FROM tab WHERE f64_count_min < '7.7';
 SELECT count(*) FROM tab WHERE f64_uniq < '7.7';
 
@@ -164,7 +164,7 @@ SELECT count(*) FROM tab WHERE dt_uniq = 7;
 SELECT 'dt and <';
 
 SELECT count(*) FROM tab WHERE dt < '2024-08-08 11:12:13';
--- SELECT count(*) FROM tab WHERE dt_tdigest < '2024-08-08 11:12:13'; -- BOOM (#67742)
+SELECT count(*) FROM tab WHERE dt_tdigest < '2024-08-08 11:12:13';
 SELECT count(*) FROM tab WHERE dt_count_min < '2024-08-08 11:12:13';
 SELECT count(*) FROM tab WHERE dt_uniq < '2024-08-08 11:12:13';
 

From fe234bd88f3eb1dca8cdb8b217606abfbcea1d54 Mon Sep 17 00:00:00 2001
From: Alexey Milovidov <milovidov@clickhouse.com>
Date: Thu, 8 Aug 2024 20:56:51 +0200
Subject: [PATCH 30/52] Fix test

---
 tests/queries/0_stateless/03218_materialize_msan.sql | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/tests/queries/0_stateless/03218_materialize_msan.sql b/tests/queries/0_stateless/03218_materialize_msan.sql
index b41300ea1e3..7e7043e687b 100644
--- a/tests/queries/0_stateless/03218_materialize_msan.sql
+++ b/tests/queries/0_stateless/03218_materialize_msan.sql
@@ -1,3 +1,5 @@
+SET enable_analyzer = 1;
+
 SELECT
     materialize([(NULL, '11\01111111\011111', '1111')]) AS t,
     (t[1048576]).2,

From bc20b637eae8bba72ecfab5256c7eace40586976 Mon Sep 17 00:00:00 2001
From: alesapin <alesapin@gmail.com>
Date: Thu, 8 Aug 2024 21:47:23 +0200
Subject: [PATCH 31/52] Add missing file

---
 .../test_broken_projections/config.d/dont_start_broken.xml  | 6 ++++++
 1 file changed, 6 insertions(+)
 create mode 100644 tests/integration/test_broken_projections/config.d/dont_start_broken.xml

diff --git a/tests/integration/test_broken_projections/config.d/dont_start_broken.xml b/tests/integration/test_broken_projections/config.d/dont_start_broken.xml
new file mode 100644
index 00000000000..9603cdc7e3e
--- /dev/null
+++ b/tests/integration/test_broken_projections/config.d/dont_start_broken.xml
@@ -0,0 +1,6 @@
+<?xml version="1.0" encoding="utf-8"?>
+<clickhouse>
+  <merge_tree>
+    <max_suspicious_broken_parts_bytes>0</max_suspicious_broken_parts_bytes>
+  </merge_tree>
+</clickhouse>

From 759299910c2892b809735caaf663fe374c315c5c Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?J=C3=A1nos=20Benjamin=20Antal?=
 <benjamin.antal@clickhouse.com>
Date: Fri, 9 Aug 2024 09:14:00 +0000
Subject: [PATCH 32/52] Force new analyzer for test

---
 tests/queries/0_stateless/03217_filtering_in_storage_merge.sql | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/queries/0_stateless/03217_filtering_in_storage_merge.sql b/tests/queries/0_stateless/03217_filtering_in_storage_merge.sql
index 5ecc1e7c672..42d31e95f9c 100644
--- a/tests/queries/0_stateless/03217_filtering_in_storage_merge.sql
+++ b/tests/queries/0_stateless/03217_filtering_in_storage_merge.sql
@@ -13,4 +13,4 @@ INSERT INTO test_03217_merge_replica_1 SELECT number AS x FROM numbers(10);
 SYSTEM SYNC REPLICA test_03217_merge_replica_2;
 
 -- If the filter on _table is not applied, then the plan will show both replicas
-EXPLAIN SELECT _table, count() FROM test_03217_all_replicas WHERE  _table = 'test_03217_merge_replica_1' AND x >= 0 GROUP BY _table;
+EXPLAIN SELECT _table, count() FROM test_03217_all_replicas WHERE  _table = 'test_03217_merge_replica_1' AND x >= 0 GROUP BY _table SETTINGS allow_experimental_analyzer=1;

From dc64550536ff249b1c12070ed646bc4321bc68bf Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?J=C3=A1nos=20Benjamin=20Antal?=
 <benjamin.antal@clickhouse.com>
Date: Fri, 9 Aug 2024 09:14:13 +0000
Subject: [PATCH 33/52] Remove wrong check from test

---
 .../0_stateless/03217_filtering_in_system_tables.reference | 4 ++--
 .../0_stateless/03217_filtering_in_system_tables.sql       | 7 +++----
 2 files changed, 5 insertions(+), 6 deletions(-)

diff --git a/tests/queries/0_stateless/03217_filtering_in_system_tables.reference b/tests/queries/0_stateless/03217_filtering_in_system_tables.reference
index 218fddf92e0..d7ccd989f53 100644
--- a/tests/queries/0_stateless/03217_filtering_in_system_tables.reference
+++ b/tests/queries/0_stateless/03217_filtering_in_system_tables.reference
@@ -1,4 +1,4 @@
 information_schema	tables
 default	test_03217_system_tables_replica_1	r1
-1	1
-1	1
+1
+1
diff --git a/tests/queries/0_stateless/03217_filtering_in_system_tables.sql b/tests/queries/0_stateless/03217_filtering_in_system_tables.sql
index 72ca7c8684d..0db846bc500 100644
--- a/tests/queries/0_stateless/03217_filtering_in_system_tables.sql
+++ b/tests/queries/0_stateless/03217_filtering_in_system_tables.sql
@@ -10,18 +10,17 @@ CREATE TABLE test_03217_system_tables_replica_2(x UInt32)
 
 -- If filtering is not done correctly on database-table column, then this query report to read 2 rows, which are the above tables
 SELECT database, table, replica_name FROM system.replicas WHERE database = currentDatabase() AND table = 'test_03217_system_tables_replica_1' AND replica_name = 'r1';
-
 SYSTEM FLUSH LOGS;
--- argMin-argMax is necessary to make the test repeatable
+-- argMax is necessary to make the test repeatable
 
 -- StorageSystemTables
-SELECT argMin(read_rows, event_time_microseconds), argMax(read_rows, event_time_microseconds) FROM system.query_log WHERE 1
+SELECT argMax(read_rows, event_time_microseconds) FROM system.query_log WHERE 1
     AND current_database = currentDatabase()
     AND query LIKE '%SELECT database, table FROM system.tables WHERE database = \'information_schema\' AND table = \'tables\';'
     AND type = 'QueryFinish';
 
 -- StorageSystemReplicas
-SELECT argMin(read_rows, event_time_microseconds), argMax(read_rows, event_time_microseconds) FROM system.query_log WHERE 1
+SELECT argMax(read_rows, event_time_microseconds) FROM system.query_log WHERE 1
     AND current_database = currentDatabase()
     AND query LIKE '%SELECT database, table, replica_name FROM system.replicas WHERE database = currentDatabase() AND table = \'test_03217_system_tables_replica_1\' AND replica_name = \'r1\';'
     AND type = 'QueryFinish';

From e4903858c8ae108b87b726a8056acab10dd6b851 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?J=C3=A1nos=20Benjamin=20Antal?=
 <benjamin.antal@clickhouse.com>
Date: Fri, 9 Aug 2024 09:31:33 +0000
Subject: [PATCH 34/52] Add extra check to make sure both replicas are present
 in system.replicas

---
 .../0_stateless/03217_filtering_in_system_tables.reference      | 2 ++
 tests/queries/0_stateless/03217_filtering_in_system_tables.sql  | 2 ++
 2 files changed, 4 insertions(+)

diff --git a/tests/queries/0_stateless/03217_filtering_in_system_tables.reference b/tests/queries/0_stateless/03217_filtering_in_system_tables.reference
index d7ccd989f53..c0761c3f689 100644
--- a/tests/queries/0_stateless/03217_filtering_in_system_tables.reference
+++ b/tests/queries/0_stateless/03217_filtering_in_system_tables.reference
@@ -1,4 +1,6 @@
 information_schema	tables
+both	default	test_03217_system_tables_replica_1	r1
+both	default	test_03217_system_tables_replica_2	r2
 default	test_03217_system_tables_replica_1	r1
 1
 1
diff --git a/tests/queries/0_stateless/03217_filtering_in_system_tables.sql b/tests/queries/0_stateless/03217_filtering_in_system_tables.sql
index 0db846bc500..2ce63559b99 100644
--- a/tests/queries/0_stateless/03217_filtering_in_system_tables.sql
+++ b/tests/queries/0_stateless/03217_filtering_in_system_tables.sql
@@ -8,6 +8,8 @@ CREATE TABLE test_03217_system_tables_replica_2(x UInt32)
     ENGINE ReplicatedMergeTree('/clickhouse/tables/{database}/test_03217_system_tables_replica', 'r2')
     ORDER BY x;
 
+-- Make sure we can read both replicas
+SELECT 'both', database, table, replica_name FROM system.replicas WHERE database = currentDatabase();
 -- If filtering is not done correctly on database-table column, then this query report to read 2 rows, which are the above tables
 SELECT database, table, replica_name FROM system.replicas WHERE database = currentDatabase() AND table = 'test_03217_system_tables_replica_1' AND replica_name = 'r1';
 SYSTEM FLUSH LOGS;

From 36c0c4562b8622b84012a12e29175f272bda2b0b Mon Sep 17 00:00:00 2001
From: Antonio Andelic <antonio@clickhouse.com>
Date: Fri, 9 Aug 2024 13:14:30 +0200
Subject: [PATCH 35/52] Fix race in WithRetries

---
 src/Backups/WithRetries.cpp | 10 ++++++++--
 1 file changed, 8 insertions(+), 2 deletions(-)

diff --git a/src/Backups/WithRetries.cpp b/src/Backups/WithRetries.cpp
index 181e6331ac9..9f22085f5a9 100644
--- a/src/Backups/WithRetries.cpp
+++ b/src/Backups/WithRetries.cpp
@@ -68,13 +68,19 @@ const WithRetries::KeeperSettings & WithRetries::getKeeperSettings() const
 
 WithRetries::FaultyKeeper WithRetries::getFaultyZooKeeper() const
 {
-    /// We need to create new instance of ZooKeeperWithFaultInjection each time a copy a pointer to ZooKeeper client there
+    zkutil::ZooKeeperPtr current_zookeeper;
+    {
+        std::lock_guard lock(zookeeper_mutex);
+        current_zookeeper = zookeeper;
+    }
+
+    /// We need to create new instance of ZooKeeperWithFaultInjection each time and copy a pointer to ZooKeeper client there
     /// The reason is that ZooKeeperWithFaultInjection may reset the underlying pointer and there could be a race condition
     /// when the same object is used from multiple threads.
     auto faulty_zookeeper = ZooKeeperWithFaultInjection::createInstance(
         settings.keeper_fault_injection_probability,
         settings.keeper_fault_injection_seed,
-        zookeeper,
+        current_zookeeper,
         log->name(),
         log);
 

From 1e3ccbc3ec81c5b9d79a034159181f1f6bdb195c Mon Sep 17 00:00:00 2001
From: Anton Popov <anton@clickhouse.com>
Date: Fri, 9 Aug 2024 11:22:44 +0000
Subject: [PATCH 36/52] add perf test for subcolumns

---
 .../optimize_functions_to_subcolumns.xml      | 27 +++++++++++++++++++
 1 file changed, 27 insertions(+)
 create mode 100644 tests/performance/optimize_functions_to_subcolumns.xml

diff --git a/tests/performance/optimize_functions_to_subcolumns.xml b/tests/performance/optimize_functions_to_subcolumns.xml
new file mode 100644
index 00000000000..a246aae7950
--- /dev/null
+++ b/tests/performance/optimize_functions_to_subcolumns.xml
@@ -0,0 +1,27 @@
+<test>
+    <settings>
+        <optimize_functions_to_subcolumns>1</optimize_functions_to_subcolumns>
+        <max_insert_threads>4</max_insert_threads>
+    </settings>
+
+    <create_query>
+        CREATE TABLE t_subcolumns (a Array(UInt64), s Nullable(String), m Map(String, UInt64)) ENGINE = MergeTree ORDER BY tuple()
+    </create_query>
+
+    <fill_query>
+        INSERT INTO t_subcolumns SELECT range(number % 20), toString(number), mapFromArrays(range(number % 20), range(number % 20)) FROM numbers_mt(50000000)
+    </fill_query>
+
+    <fill_query>
+        OPTIMIZE TABLE t_subcolumns FINAL
+    </fill_query>
+
+    <query>SELECT count() FROM t_subcolumns WHERE NOT ignore(length(a))</query>
+    <query>SELECT count() FROM t_subcolumns WHERE notEmpty(a)</query>
+    <query>SELECT count() FROM t_subcolumns WHERE NOT ignore(length(m))</query>
+    <query>SELECT count() FROM t_subcolumns WHERE notEmpty(m)</query>
+    <query>SELECT count() FROM t_subcolumns WHERE isNotNull(s)</query>
+    <query>SELECT count(s) FROM t_subcolumns</query>
+
+    <drop_query>DROP TABLE t_subcolumns</drop_query>
+</test>

From e8f2f65e62c65878463879396b7ebdceed48c5e3 Mon Sep 17 00:00:00 2001
From: Nikolai Kochetov <nk@clickhouse.com>
Date: Fri, 9 Aug 2024 11:51:23 +0000
Subject: [PATCH 37/52] Avoid converting type to string and back in _CAST

---
 src/Functions/CastOverloadResolver.cpp        | 23 +++++++++++++++----
 src/Functions/CastOverloadResolver.h          |  6 ++++-
 src/Functions/toBool.cpp                      |  3 +--
 src/Interpreters/ActionsDAG.cpp               | 12 +++++-----
 src/Interpreters/castColumn.cpp               |  6 ++---
 .../optimizeUseAggregateProjection.cpp        | 21 ++++++-----------
 src/Processors/Transforms/WindowTransform.cpp | 17 ++------------
 src/Storages/MergeTree/KeyCondition.cpp       |  7 ++----
 .../MergeTreeSplitPrewhereIntoReadSteps.cpp   | 20 +++++-----------
 ...rojection_with_normalized_states.reference |  1 +
 ...gate_projection_with_normalized_states.sql |  2 ++
 11 files changed, 52 insertions(+), 66 deletions(-)

diff --git a/src/Functions/CastOverloadResolver.cpp b/src/Functions/CastOverloadResolver.cpp
index 49f63073aaf..6cb4d492fd8 100644
--- a/src/Functions/CastOverloadResolver.cpp
+++ b/src/Functions/CastOverloadResolver.cpp
@@ -3,6 +3,7 @@
 #include <Functions/FunctionHelpers.h>
 #include <DataTypes/DataTypeFactory.h>
 #include <DataTypes/DataTypeNullable.h>
+#include <DataTypes/DataTypeString.h>
 #include <Columns/ColumnString.h>
 #include <Core/Settings.h>
 #include <Interpreters/parseColumnsListForTableFunction.h>
@@ -35,7 +36,7 @@ FunctionBasePtr createFunctionBaseCast(
 class CastOverloadResolverImpl : public IFunctionOverloadResolver
 {
 public:
-    const char * getNameImpl() const
+    static const char * getNameImpl(CastType cast_type, bool internal)
     {
         if (cast_type == CastType::accurate)
             return "accurateCast";
@@ -49,7 +50,7 @@ public:
 
     String getName() const override
     {
-        return getNameImpl();
+        return getNameImpl(cast_type, internal);
     }
 
     size_t getNumberOfArguments() const override { return 2; }
@@ -79,10 +80,22 @@ public:
         }
     }
 
+    static FunctionBasePtr createInternalCast(ColumnWithTypeAndName from, DataTypePtr to, CastType cast_type, std::optional<CastDiagnostic> diagnostic)
+    {
+        if (cast_type == CastType::accurateOrNull && !isVariant(to))
+            to = makeNullable(to);
+
+        /// Two arguments are passed: the source column and a second entry for which only the String type is set (no column).
+        ColumnsWithTypeAndName arguments;
+        arguments.emplace_back(std::move(from));
+        arguments.emplace_back().type = std::make_shared<DataTypeString>();
+        return createFunctionBaseCast(nullptr, getNameImpl(cast_type, true), arguments, to, diagnostic, cast_type);
+    }
+
 protected:
     FunctionBasePtr buildImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr & return_type) const override
     {
-        return createFunctionBaseCast(context, getNameImpl(), arguments, return_type, diagnostic, cast_type);
+        return createFunctionBaseCast(context, getNameImpl(cast_type, internal), arguments, return_type, diagnostic, cast_type);
     }
 
     DataTypePtr getReturnTypeImpl(const ColumnsWithTypeAndName & arguments) const override
@@ -130,9 +143,9 @@ private:
 };
 
 
-FunctionOverloadResolverPtr createInternalCastOverloadResolver(CastType type, std::optional<CastDiagnostic> diagnostic)
+FunctionBasePtr createInternalCast(ColumnWithTypeAndName from, DataTypePtr to, CastType cast_type, std::optional<CastDiagnostic> diagnostic)
 {
-    return CastOverloadResolverImpl::create(ContextPtr{}, type, true, diagnostic);
+    return CastOverloadResolverImpl::createInternalCast(std::move(from), std::move(to), cast_type, std::move(diagnostic));
 }
 
 REGISTER_FUNCTION(CastOverloadResolvers)
diff --git a/src/Functions/CastOverloadResolver.h b/src/Functions/CastOverloadResolver.h
index 7d98f774812..66f9d6cfcaf 100644
--- a/src/Functions/CastOverloadResolver.h
+++ b/src/Functions/CastOverloadResolver.h
@@ -3,6 +3,7 @@
 #include <memory>
 #include <optional>
 #include <Interpreters/Context_fwd.h>
+#include <Core/ColumnWithTypeAndName.h>
 
 
 namespace DB
@@ -11,6 +12,9 @@ namespace DB
 class IFunctionOverloadResolver;
 using FunctionOverloadResolverPtr = std::shared_ptr<IFunctionOverloadResolver>;
 
+class IFunctionBase;
+using FunctionBasePtr = std::shared_ptr<const IFunctionBase>;
+
 enum class CastType : uint8_t
 {
     nonAccurate,
@@ -24,6 +28,6 @@ struct CastDiagnostic
     std::string column_to;
 };
 
-FunctionOverloadResolverPtr createInternalCastOverloadResolver(CastType type, std::optional<CastDiagnostic> diagnostic);
+FunctionBasePtr createInternalCast(ColumnWithTypeAndName from, DataTypePtr to, CastType cast_type, std::optional<CastDiagnostic> diagnostic);
 
 }
diff --git a/src/Functions/toBool.cpp b/src/Functions/toBool.cpp
index 6f2c436c1ea..ac595d313e3 100644
--- a/src/Functions/toBool.cpp
+++ b/src/Functions/toBool.cpp
@@ -54,8 +54,7 @@ namespace
                 }
             };
 
-            FunctionOverloadResolverPtr func_builder_cast = createInternalCastOverloadResolver(CastType::nonAccurate, {});
-            auto func_cast = func_builder_cast->build(cast_args);
+            auto func_cast = createInternalCast(arguments[0], result_type, CastType::nonAccurate, {});
             return func_cast->execute(cast_args, result_type, arguments[0].column->size());
         }
     };
diff --git a/src/Interpreters/ActionsDAG.cpp b/src/Interpreters/ActionsDAG.cpp
index df1c0aa1f2a..2a594839c6a 100644
--- a/src/Interpreters/ActionsDAG.cpp
+++ b/src/Interpreters/ActionsDAG.cpp
@@ -301,11 +301,11 @@ const ActionsDAG::Node & ActionsDAG::addCast(const Node & node_to_cast, const Da
     column.column = DataTypeString().createColumnConst(0, cast_type_constant_value);
     column.type = std::make_shared<DataTypeString>();
 
-    const auto * cast_type_constant_node = &addColumn(std::move(column));
+    const auto * cast_type_constant_node = &addColumn(column);
     ActionsDAG::NodeRawConstPtrs children = {&node_to_cast, cast_type_constant_node};
-    FunctionOverloadResolverPtr func_builder_cast = createInternalCastOverloadResolver(CastType::nonAccurate, {});
+    auto func_base_cast = createInternalCast(ColumnWithTypeAndName{node_to_cast.result_type, node_to_cast.result_name}, cast_type, CastType::nonAccurate, {});
 
-    return addFunction(func_builder_cast, std::move(children), result_name);
+    return addFunction(func_base_cast, std::move(children), result_name);
 }
 
 const ActionsDAG::Node & ActionsDAG::addFunctionImpl(
@@ -1547,11 +1547,11 @@ ActionsDAG ActionsDAG::makeConvertingActions(
             const auto * left_arg = dst_node;
 
             CastDiagnostic diagnostic = {dst_node->result_name, res_elem.name};
-            FunctionOverloadResolverPtr func_builder_cast
-                = createInternalCastOverloadResolver(CastType::nonAccurate, std::move(diagnostic));
+            ColumnWithTypeAndName left_column{nullptr, dst_node->result_type, {}};
+            auto func_base_cast = createInternalCast(std::move(left_column), res_elem.type, CastType::nonAccurate, std::move(diagnostic));
 
             NodeRawConstPtrs children = { left_arg, right_arg };
-            dst_node = &actions_dag.addFunction(func_builder_cast, std::move(children), {});
+            dst_node = &actions_dag.addFunction(func_base_cast, std::move(children), {});
         }
 
         if (dst_node->column && isColumnConst(*dst_node->column) && !(res_elem.column && isColumnConst(*res_elem.column)))
diff --git a/src/Interpreters/castColumn.cpp b/src/Interpreters/castColumn.cpp
index 906dfb84b14..a779c9bc34d 100644
--- a/src/Interpreters/castColumn.cpp
+++ b/src/Interpreters/castColumn.cpp
@@ -26,11 +26,9 @@ static ColumnPtr castColumn(CastType cast_type, const ColumnWithTypeAndName & ar
             ""
         }
     };
-    auto get_cast_func = [cast_type, &arguments]
+    auto get_cast_func = [from = arg, to = type, cast_type]
     {
-
-        FunctionOverloadResolverPtr func_builder_cast = createInternalCastOverloadResolver(cast_type, {});
-        return func_builder_cast->build(arguments);
+        return createInternalCast(from, to, cast_type, {});
     };
 
     FunctionBasePtr func_cast = cache ? cache->getOrSet(cast_type, from_name, to_name, std::move(get_cast_func)) : get_cast_func();
diff --git a/src/Processors/QueryPlan/Optimizations/optimizeUseAggregateProjection.cpp b/src/Processors/QueryPlan/Optimizations/optimizeUseAggregateProjection.cpp
index 52d1931c51e..b31ee7ea53c 100644
--- a/src/Processors/QueryPlan/Optimizations/optimizeUseAggregateProjection.cpp
+++ b/src/Processors/QueryPlan/Optimizations/optimizeUseAggregateProjection.cpp
@@ -255,20 +255,13 @@ static void appendAggregateFunctions(
 
         const auto * node = input;
 
-        if (node->result_name != aggregate.column_name)
-        {
-            if (DataTypeAggregateFunction::strictEquals(type, node->result_type))
-            {
-                node = &proj_dag.addAlias(*node, aggregate.column_name);
-            }
-            else
-            {
-                /// Cast to aggregate types specified in query if it's not
-                /// strictly the same as the one specified in projection. This
-                /// is required to generate correct results during finalization.
-                node = &proj_dag.addCast(*node, type, aggregate.column_name);
-            }
-        }
+        if (!DataTypeAggregateFunction::strictEquals(type, node->result_type))
+            /// Cast to aggregate types specified in query if it's not
+            /// strictly the same as the one specified in projection. This
+            /// is required to generate correct results during finalization.
+            node = &proj_dag.addCast(*node, type, aggregate.column_name);
+        else if (node->result_name != aggregate.column_name)
+            node = &proj_dag.addAlias(*node, aggregate.column_name);
 
         proj_dag_outputs.push_back(node);
     }
diff --git a/src/Processors/Transforms/WindowTransform.cpp b/src/Processors/Transforms/WindowTransform.cpp
index c26cd7cc8c3..c27c230c741 100644
--- a/src/Processors/Transforms/WindowTransform.cpp
+++ b/src/Processors/Transforms/WindowTransform.cpp
@@ -2337,22 +2337,9 @@ struct WindowFunctionLagLeadInFrame final : public WindowFunction
                 argument_types[2]->getName());
         }
 
-        const auto from_name = argument_types[2]->getName();
-        const auto to_name = argument_types[0]->getName();
-        ColumnsWithTypeAndName arguments
+        auto get_cast_func = [from = argument_types[2], to = argument_types[0]]
         {
-            { argument_types[2], "" },
-            {
-                DataTypeString().createColumnConst(0, to_name),
-                std::make_shared<DataTypeString>(),
-                ""
-            }
-        };
-
-        auto get_cast_func = [&arguments]
-        {
-            FunctionOverloadResolverPtr func_builder_cast = createInternalCastOverloadResolver(CastType::accurate, {});
-            return func_builder_cast->build(arguments);
+            return createInternalCast({from, {}}, to, CastType::accurate, {});
         };
 
         func_cast = get_cast_func();
diff --git a/src/Storages/MergeTree/KeyCondition.cpp b/src/Storages/MergeTree/KeyCondition.cpp
index dfb43c4e75d..aa7a498d5a3 100644
--- a/src/Storages/MergeTree/KeyCondition.cpp
+++ b/src/Storages/MergeTree/KeyCondition.cpp
@@ -1956,11 +1956,8 @@ bool KeyCondition::extractAtomFromTree(const RPNBuilderTreeNode & node, RPNEleme
                         auto common_type_maybe_nullable = (key_expr_type_is_nullable && !common_type->isNullable())
                             ? DataTypePtr(std::make_shared<DataTypeNullable>(common_type))
                             : common_type;
-                        ColumnsWithTypeAndName arguments{
-                            {nullptr, key_expr_type, ""},
-                            {DataTypeString().createColumnConst(1, common_type_maybe_nullable->getName()), common_type_maybe_nullable, ""}};
-                        FunctionOverloadResolverPtr func_builder_cast = createInternalCastOverloadResolver(CastType::nonAccurate, {});
-                        auto func_cast = func_builder_cast->build(arguments);
+
+                        auto func_cast = createInternalCast({key_expr_type, {}}, common_type_maybe_nullable, CastType::nonAccurate, {});
 
                         /// If we know the given range only contains one value, then we treat all functions as positive monotonic.
                         if (!single_point && !func_cast->hasInformationAboutMonotonicity())
diff --git a/src/Storages/MergeTree/MergeTreeSplitPrewhereIntoReadSteps.cpp b/src/Storages/MergeTree/MergeTreeSplitPrewhereIntoReadSteps.cpp
index 36ff6c0a4bd..9c82817e8cb 100644
--- a/src/Storages/MergeTree/MergeTreeSplitPrewhereIntoReadSteps.cpp
+++ b/src/Storages/MergeTree/MergeTreeSplitPrewhereIntoReadSteps.cpp
@@ -152,23 +152,15 @@ const ActionsDAG::Node & addFunction(
 const ActionsDAG::Node & addCast(
         const ActionsDAGPtr & dag,
         const ActionsDAG::Node & node_to_cast,
-        const String & type_name,
+        const DataTypePtr & to_type,
         OriginalToNewNodeMap & node_remap)
 {
-    if (node_to_cast.result_type->getName() == type_name)
+    if (node_to_cast.result_type->equals(*to_type)) /// Already of the target type: return the node as is, no cast needed.
         return node_to_cast;
 
-    Field cast_type_constant_value(type_name);
-
-    ColumnWithTypeAndName column;
-    column.column = DataTypeString().createColumnConst(0, cast_type_constant_value);
-    column.type = std::make_shared<DataTypeString>();
-
-    const auto * cast_type_constant_node = &dag->addColumn(std::move(column));
-    ActionsDAG::NodeRawConstPtrs children = {&node_to_cast, cast_type_constant_node};
-    FunctionOverloadResolverPtr func_builder_cast = createInternalCastOverloadResolver(CastType::nonAccurate, {});
-
-    return addFunction(dag, func_builder_cast, std::move(children), node_remap);
+    const auto & new_node = dag->addCast(node_to_cast, to_type, {});
+    node_remap[new_node.result_name] = {dag.get(), &new_node}; /// Record the cast node in the remap under its result name.
+    return new_node;
 }
 
 /// Normalizes the filter node by adding AND with a constant true.
@@ -332,7 +324,7 @@ bool tryBuildPrewhereSteps(PrewhereInfoPtr prewhere_info, const ExpressionAction
             /// Build AND(last_step_result_node, true)
             const auto & and_node = addAndTrue(last_step_dag, *last_step_result_node_info.node, node_remap);
             /// Build CAST(and_node, type of PREWHERE column)
-            const auto & cast_node = addCast(last_step_dag, and_node, output->result_type->getName(), node_remap);
+            const auto & cast_node = addCast(last_step_dag, and_node, output->result_type, node_remap);
             /// Add alias for the result with the name of the PREWHERE column
             const auto & prewhere_result_node = last_step_dag->addAlias(cast_node, output->result_name);
             last_step_dag->addOrReplaceInOutputs(prewhere_result_node);
diff --git a/tests/queries/0_stateless/01710_aggregate_projection_with_normalized_states.reference b/tests/queries/0_stateless/01710_aggregate_projection_with_normalized_states.reference
index 25aa9dc5dec..37993873983 100644
--- a/tests/queries/0_stateless/01710_aggregate_projection_with_normalized_states.reference
+++ b/tests/queries/0_stateless/01710_aggregate_projection_with_normalized_states.reference
@@ -1,2 +1,3 @@
 3
 950	990	500	2000
+[950]	[999]
diff --git a/tests/queries/0_stateless/01710_aggregate_projection_with_normalized_states.sql b/tests/queries/0_stateless/01710_aggregate_projection_with_normalized_states.sql
index 5375823aa8e..956bf3711a2 100644
--- a/tests/queries/0_stateless/01710_aggregate_projection_with_normalized_states.sql
+++ b/tests/queries/0_stateless/01710_aggregate_projection_with_normalized_states.sql
@@ -29,4 +29,6 @@ FROM cluster('test_cluster_two_shards', currentDatabase(), r)
 WHERE a = 'x'
 settings prefer_localhost_replica=0;
 
+SELECT quantilesTimingMerge(0.95)(q), quantilesTimingMerge(toInt64(1))(q) FROM remote('127.0.0.{1,2}', currentDatabase(), r);
+
 DROP TABLE r;

From 3d850f8ceb0ca5cfae26e8faa7c4d900cc4e8fda Mon Sep 17 00:00:00 2001
From: Nikita Taranov <nikita.taranov@clickhouse.com>
Date: Fri, 9 Aug 2024 13:58:02 +0200
Subject: [PATCH 38/52] fix

---
 src/Processors/Sources/ShellCommandSource.cpp | 18 ++++++------------
 1 file changed, 6 insertions(+), 12 deletions(-)

diff --git a/src/Processors/Sources/ShellCommandSource.cpp b/src/Processors/Sources/ShellCommandSource.cpp
index 23359367a9b..f55a3713215 100644
--- a/src/Processors/Sources/ShellCommandSource.cpp
+++ b/src/Processors/Sources/ShellCommandSource.cpp
@@ -70,17 +70,16 @@ static void makeFdBlocking(int fd)
 
 static int pollWithTimeout(pollfd * pfds, size_t num, size_t timeout_milliseconds)
 {
+    auto logger = getLogger("TimeoutReadBufferFromFileDescriptor");
+    auto describe_fd = [](const auto & pollfd) { return fmt::format("(fd={}, flags={})", pollfd.fd, fcntl(pollfd.fd, F_GETFL)); };
+
     int res;
 
     while (true)
     {
         Stopwatch watch;
 
-        auto describe_fd = [](const auto & pollfd) { return fmt::format("(fd={}, flags={})", pollfd.fd, fcntl(pollfd.fd, F_GETFL)); };
-        LOG_TEST(
-            getLogger("TimeoutReadBufferFromFileDescriptor"),
-            "Polling descriptors: {}",
-            fmt::join(std::span(pfds, pfds + num) | std::views::transform(describe_fd), ", "));
+        LOG_TEST(logger, "Polling descriptors: {}", fmt::join(std::span(pfds, pfds + num) | std::views::transform(describe_fd), ", "));
 
         res = poll(pfds, static_cast<nfds_t>(num), static_cast<int>(timeout_milliseconds));
 
@@ -92,11 +91,7 @@ static int pollWithTimeout(pollfd * pfds, size_t num, size_t timeout_millisecond
             const auto elapsed = watch.elapsedMilliseconds();
             if (timeout_milliseconds <= elapsed)
             {
-                LOG_TEST(
-                    getLogger("TimeoutReadBufferFromFileDescriptor"),
-                    "Timeout exceeded: elapsed={}, timeout={}",
-                    elapsed,
-                    timeout_milliseconds);
+                LOG_TEST(logger, "Timeout exceeded: elapsed={}, timeout={}", elapsed, timeout_milliseconds);
                 break;
             }
             timeout_milliseconds -= elapsed;
@@ -107,9 +102,8 @@ static int pollWithTimeout(pollfd * pfds, size_t num, size_t timeout_millisecond
         }
     }
 
-    auto describe_fd = [](const auto & pollfd) { return fmt::format("(fd={}, flags={})", pollfd.fd, fcntl(pollfd.fd, F_GETFL)); };
     LOG_TEST(
-        getLogger("TimeoutReadBufferFromFileDescriptor"),
+        logger,
         "Poll for descriptors: {} returned {}",
         fmt::join(std::span(pfds, pfds + num) | std::views::transform(describe_fd), ", "),
         res);

From 20563bc6cbc6e70eb6926c5f21fded356270f40f Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?J=C3=A1nos=20Benjamin=20Antal?=
 <benjamin.antal@clickhouse.com>
Date: Fri, 9 Aug 2024 12:19:44 +0000
Subject: [PATCH 39/52] Make test work with ReplicatedDatabase in test

---
 .../0_stateless/03217_filtering_in_system_tables.sql      | 8 +++++---
 1 file changed, 5 insertions(+), 3 deletions(-)

diff --git a/tests/queries/0_stateless/03217_filtering_in_system_tables.sql b/tests/queries/0_stateless/03217_filtering_in_system_tables.sql
index 2ce63559b99..eb506dfe39a 100644
--- a/tests/queries/0_stateless/03217_filtering_in_system_tables.sql
+++ b/tests/queries/0_stateless/03217_filtering_in_system_tables.sql
@@ -9,9 +9,11 @@ CREATE TABLE test_03217_system_tables_replica_2(x UInt32)
     ORDER BY x;
 
 -- Make sure we can read both replicas
-SELECT 'both', database, table, replica_name FROM system.replicas WHERE database = currentDatabase();
+-- The replica name might be altered because of `_functional_tests_helper_database_replicated_replace_args_macros`,
+-- thus we need to use `left`
+SELECT 'both', database, table, left(replica_name, 2) FROM system.replicas WHERE database = currentDatabase();
 -- If filtering is not done correctly on database-table column, then this query report to read 2 rows, which are the above tables
-SELECT database, table, replica_name FROM system.replicas WHERE database = currentDatabase() AND table = 'test_03217_system_tables_replica_1' AND replica_name = 'r1';
+SELECT database, table, left(replica_name, 2) FROM system.replicas WHERE database = currentDatabase() AND table = 'test_03217_system_tables_replica_1' AND replica_name LIKE 'r1%';
 SYSTEM FLUSH LOGS;
 -- argMax is necessary to make the test repeatable
 
@@ -24,5 +26,5 @@ SELECT argMax(read_rows, event_time_microseconds) FROM system.query_log WHERE 1
 -- StorageSystemReplicas
 SELECT argMax(read_rows, event_time_microseconds) FROM system.query_log WHERE 1
     AND current_database = currentDatabase()
-    AND query LIKE '%SELECT database, table, replica_name FROM system.replicas WHERE database = currentDatabase() AND table = \'test_03217_system_tables_replica_1\' AND replica_name = \'r1\';'
+    AND query LIKE '%SELECT database, table, left(replica_name, 2) FROM system.replicas WHERE database = currentDatabase() AND table = \'test_03217_system_tables_replica_1\' AND replica_name LIKE \'r1\%\';'
     AND type = 'QueryFinish';

From 65ebcd6f21b26144cb47e6b71c939517b1fb38a2 Mon Sep 17 00:00:00 2001
From: Nikolai Kochetov <nk@clickhouse.com>
Date: Fri, 9 Aug 2024 13:55:47 +0000
Subject: [PATCH 40/52] Fixing test.

---
 .../0_stateless/01656_test_query_log_factories_info.reference   | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/queries/0_stateless/01656_test_query_log_factories_info.reference b/tests/queries/0_stateless/01656_test_query_log_factories_info.reference
index 47b3133ceca..44531c19ab7 100644
--- a/tests/queries/0_stateless/01656_test_query_log_factories_info.reference
+++ b/tests/queries/0_stateless/01656_test_query_log_factories_info.reference
@@ -17,7 +17,7 @@ used_functions
 ['repeat']
 
 arraySort(used_data_type_families)
-['Array','Int32','Nullable','String']
+['Int32','Nullable','String']
 
 used_database_engines
 ['Atomic']

From c13d348d1e8a467b9d16fc83214ef574752092e0 Mon Sep 17 00:00:00 2001
From: Alexey Milovidov <milovidov@clickhouse.com>
Date: Fri, 9 Aug 2024 19:56:50 +0200
Subject: [PATCH 41/52] Fix test `00900_long_parquet_load`

---
 tests/queries/0_stateless/00900_long_parquet_load.sh | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/queries/0_stateless/00900_long_parquet_load.sh b/tests/queries/0_stateless/00900_long_parquet_load.sh
index 1bafb033f56..3a7022ac0cf 100755
--- a/tests/queries/0_stateless/00900_long_parquet_load.sh
+++ b/tests/queries/0_stateless/00900_long_parquet_load.sh
@@ -1,5 +1,5 @@
 #!/usr/bin/env bash
-# Tags: long, no-fasttest, no-debug
+# Tags: long, no-fasttest, no-debug, no-asan, no-msan, no-tsan
 
 #
 # Load all possible .parquet files found in submodules.

From b5afddb1af0a9aeb4738cf3fb7b7242361469028 Mon Sep 17 00:00:00 2001
From: Anton Popov <anton@clickhouse.com>
Date: Fri, 9 Aug 2024 22:56:25 +0200
Subject: [PATCH 42/52] Update optimize_functions_to_subcolumns.xml

---
 tests/performance/optimize_functions_to_subcolumns.xml | 1 -
 1 file changed, 1 deletion(-)

diff --git a/tests/performance/optimize_functions_to_subcolumns.xml b/tests/performance/optimize_functions_to_subcolumns.xml
index a246aae7950..146af1605c4 100644
--- a/tests/performance/optimize_functions_to_subcolumns.xml
+++ b/tests/performance/optimize_functions_to_subcolumns.xml
@@ -1,6 +1,5 @@
 <test>
     <settings>
-        <optimize_functions_to_subcolumns>1</optimize_functions_to_subcolumns>
         <max_insert_threads>4</max_insert_threads>
     </settings>
 

From 9b9fff4232d80e579b1d23ced8bfbb1b2c5e2147 Mon Sep 17 00:00:00 2001
From: Nikita Fomichev <nikita.fomichev@clickhouse.com>
Date: Sat, 10 Aug 2024 08:48:08 +0200
Subject: [PATCH 43/52] Push CI


From e582118544f3c49c3c6600ac8fa252151714d25f Mon Sep 17 00:00:00 2001
From: Blargian <shaunstruwig.ss@gmail.com>
Date: Sat, 10 Aug 2024 13:09:40 +0200
Subject: [PATCH 44/52] review changes

---
 .../functions/type-conversion-functions.md    | 916 +++++++++++++++---
 1 file changed, 801 insertions(+), 115 deletions(-)

diff --git a/docs/en/sql-reference/functions/type-conversion-functions.md b/docs/en/sql-reference/functions/type-conversion-functions.md
index 8e72fea7fdb..5c06e72f977 100644
--- a/docs/en/sql-reference/functions/type-conversion-functions.md
+++ b/docs/en/sql-reference/functions/type-conversion-functions.md
@@ -64,9 +64,8 @@ toInt8(expr)
 - `expr` — Expression returning a number or a string representation of a number. [Expression](../syntax.md/#syntax-expressions).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Unsupported arguments:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -251,9 +250,8 @@ toInt8OrDefault(expr[, default])
 - `default` (optional) — The default value to return if parsing to type `Int8` is unsuccessful. [Int8](../data-types/int-uint.md).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Arguments for which the default value is returned:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -314,9 +312,8 @@ toInt16(expr)
 - `expr` — Expression returning a number or a string representation of a number. [Expression](../syntax.md/#syntax-expressions).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Unsupported arguments:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -501,9 +498,8 @@ toInt16OrDefault(expr[, default])
 - `default` (optional) — The default value to return if parsing to type `Int16` is unsuccessful. [Int16](../data-types/int-uint.md).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Arguments for which the default value is returned:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -564,9 +560,8 @@ toInt32(expr)
 - `expr` — Expression returning a number or a string representation of a number. [Expression](../syntax.md/#syntax-expressions).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Unsupported arguments:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -750,9 +745,8 @@ toInt32OrDefault(expr[, default])
 - `default` (optional) — The default value to return if parsing to type `Int32` is unsuccessful. [Int32](../data-types/int-uint.md).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Arguments for which the default value is returned:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -813,9 +807,8 @@ toInt64(expr)
 - `expr` — Expression returning a number or a string representation of a number. [Expression](../syntax.md/#syntax-expressions).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Unsupported types:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -1000,9 +993,8 @@ toInt64OrDefault(expr[, default])
 - `default` (optional) — The default value to return if parsing to type `Int64` is unsuccessful. [Int64](../data-types/int-uint.md).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Arguments for which the default value is returned:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -1063,9 +1055,8 @@ toInt128(expr)
 - `expr` — Expression returning a number or a string representation of a number. [Expression](../syntax.md/#syntax-expressions).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Unsupported arguments:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -1312,9 +1303,8 @@ toInt256(expr)
 - `expr` — Expression returning a number or a string representation of a number. [Expression](../syntax.md/#syntax-expressions).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Unsupported arguments:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -1498,9 +1488,8 @@ toInt256OrDefault(expr[, default])
 - `default` (optional) — The default value to return if parsing to type `Int256` is unsuccessful. [Int256](../data-types/int-uint.md).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Arguments for which the default value is returned:
 - String representations of Float32/64 values, including `NaN` and `Inf`
@@ -1561,9 +1550,8 @@ toUInt8(expr)
 - `expr` — Expression returning a number or a string representation of a number. [Expression](../syntax.md/#syntax-expressions).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Unsupported arguments:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -1748,9 +1736,8 @@ toUInt8OrDefault(expr[, default])
 - `default` (optional) — The default value to return if parsing to type `UInt8` is unsuccessful. [UInt8](../data-types/int-uint.md).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Arguments for which the default value is returned:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -1811,9 +1798,8 @@ toUInt16(expr)
 - `expr` — Expression returning a number or a string representation of a number. [Expression](../syntax.md/#syntax-expressions).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Unsupported arguments:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -1998,9 +1984,8 @@ toUInt16OrDefault(expr[, default])
 - `default` (optional) — The default value to return if parsing to type `UInt16` is unsuccessful. [UInt16](../data-types/int-uint.md).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Arguments for which the default value is returned:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -2061,9 +2046,8 @@ toUInt32(expr)
 - `expr` — Expression returning a number or a string representation of a number. [Expression](../syntax.md/#syntax-expressions).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Unsupported arguments:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -2249,9 +2233,8 @@ toUInt32OrDefault(expr[, default])
 - `default` (optional) — The default value to return if parsing to type `UInt32` is unsuccessful. [UInt32](../data-types/int-uint.md).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Arguments for which the default value is returned:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -2312,9 +2295,8 @@ toUInt64(expr)
 - `expr` — Expression returning a number or a string representation of a number. [Expression](../syntax.md/#syntax-expressions).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Unsupported types:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -2499,9 +2481,8 @@ toUInt64OrDefault(expr[, default])
 - `defauult` (optional) — The default value to return if parsing to type `UInt64` is unsuccessful. [UInt64](../data-types/int-uint.md).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Arguments for which the default value is returned:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -2562,9 +2543,8 @@ toUInt128(expr)
 - `expr` — Expression returning a number or a string representation of a number. [Expression](../syntax.md/#syntax-expressions).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Unsupported arguments:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -2811,9 +2791,8 @@ toUInt256(expr)
 - `expr` — Expression returning a number or a string representation of a number. [Expression](../syntax.md/#syntax-expressions).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Unsupported arguments:
 - String representations of Float32/64 values, including `NaN` and `Inf`.
@@ -2997,9 +2976,8 @@ toUInt256OrDefault(expr[, default])
 - `default` (optional) — The default value to return if parsing to type `UInt256` is unsuccessful. [UInt256](../data-types/int-uint.md).
 
 Supported arguments:
-- Values of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type (U)Int8/16/32/64/128/256.
 - Values of type Float32/64.
-- String representations of (U)Int8/16/32/128/256.
 
 Arguments for which the default value is returned:
 - String representations of Float32/64 values, including `NaN` and `Inf`
@@ -3555,7 +3533,7 @@ toDecimal32(expr, S)
 **Arguments**
 
 - `expr` — Expression returning a number or a string representation of a number. [Expression](../syntax.md/#syntax-expressions).
-- `S` — Scale parameter from [ 1 : 9 ] specifying how many decimal digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+- `S` — Scale parameter between 0 and 9, specifying how many digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
 
 Supported arguments:
 - Values or string representations of type (U)Int8/16/32/64/128/256.
@@ -3566,7 +3544,7 @@ Unsupported arguments:
 - String representations of binary and hexadecimal values, e.g. `SELECT toDecimal32('0xc0fe', 1);`.
 
 :::note
-Integer overflow can occur if the value of `expr` exceeds the bounds of `Decimal32`: `( -1 * 10^(9 - S), 1 * 10^(9 - S) )`. 
+An overflow can occur if the value of `expr` exceeds the bounds of `Decimal32`: `( -1 * 10^(9 - S), 1 * 10^(9 - S) )`. 
 Excessive digits in a fraction are discarded (not rounded). 
 Excessive digits in the integer part will lead to an exception.
 :::
@@ -3619,20 +3597,20 @@ toDecimal32OrZero(expr, S)
 **Arguments**
 
 - `expr` — A String representation of a number. [String](../data-types/string.md).
-- `S` — Scale parameter from [ 1 : 9 ] specifying how many decimal digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+- `S` — Scale parameter between 0 and 9, specifying how many digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
 
 Supported arguments:
 - String representations of type (U)Int8/16/32/64/128/256.
 - String representations of type Float32/64.
 
 Unsupported arguments:
-- String representations of Float32/64 values `NaN` and `Inf` (case-insensitive).
+- String representations of Float32/64 values `NaN` and `Inf`.
 - String representations of binary and hexadecimal values, e.g. `SELECT toDecimal32OrZero('0xc0fe', 1);`.
 
 :::note
-Integer overflow can occur if the value of `expr` exceeds the bounds of `Decimal32`: `( -1 * 10^(9 - S), 1 * 10^(9 - S) )`.
+An overflow can occur if the value of `expr` exceeds the bounds of `Decimal32`: `( -1 * 10^(9 - S), 1 * 10^(9 - S) )`.
 Excessive digits in a fraction are discarded (not rounded).
-Excessive digits in the integer part will lead to an exception.
+Excessive digits in the integer part will lead to an error.
 :::
 
 **Returned value**
@@ -3645,8 +3623,10 @@ Query:
 
 ``` sql
 SELECT
-    toDecimal32OrZero(toString(-1.111), 5) AS val,
-    toTypeName(val)
+    toDecimal32OrZero(toString(-1.111), 5) AS a,
+    toTypeName(a),
+    toDecimal32OrZero(toString('Inf'), 5) as b,
+    toTypeName(b)
 FORMAT Vertical;
 ```
 
@@ -3655,26 +3635,10 @@ Result:
 ```response
 Row 1:
 ──────
-val:             -1.111
-toTypeName(val): Decimal(9, 5)
-```
-
-Query:
-
-``` sql
-SELECT
-    toDecimal32OrZero(toString(-1.111), 2) AS val,
-    toTypeName(val)
-FORMAT Vertical;
-```
-
-Result:
-
-```response
-Row 1:
-──────
-val:             -1.11
-toTypeName(val): Decimal(9, 2)
+a:             -1.111
+toTypeName(a): Decimal(9, 5)
+b:             0
+toTypeName(b): Decimal(9, 5)
 ```
 
 **See also**
@@ -3696,20 +3660,20 @@ toDecimal32OrNull(expr, S)
 **Arguments**
 
 - `expr` — A String representation of a number. [String](../data-types/string.md).
-- `S` — Scale parameter from [ 1 : 9 ] specifying how many decimal digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+- `S` — Scale parameter between 0 and 9, specifying how many digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
 
 Supported arguments:
 - String representations of type (U)Int8/16/32/64/128/256.
 - String representations of type Float32/64.
 
 Unsupported arguments:
-- String representations of Float32/64 values `NaN` and `Inf` (case-insensitive).
+- String representations of Float32/64 values `NaN` and `Inf`.
 - String representations of binary and hexadecimal values, e.g. `SELECT toDecimal32OrNull('0xc0fe', 1);`.
 
 :::note
-Integer overflow can occur if the value of `expr` exceeds the bounds of `Decimal32`: `( -1 * 10^(9 - S), 1 * 10^(9 - S) )`.
+An overflow can occur if the value of `expr` exceeds the bounds of `Decimal32`: `( -1 * 10^(9 - S), 1 * 10^(9 - S) )`.
 Excessive digits in a fraction are discarded (not rounded).
-Excessive digits in the integer part will lead to an exception.
+Excessive digits in the integer part will lead to an error.
 :::
 
 **Returned value**
@@ -3722,8 +3686,10 @@ Query:
 
 ``` sql
 SELECT
-    toDecimal32OrNull(toString(-1.111), 5) AS val,
-    toTypeName(val)
+    toDecimal32OrNull(toString(-1.111), 5) AS a,
+    toTypeName(a),
+    toDecimal32OrNull(toString('Inf'), 5) as b,
+    toTypeName(b)
 FORMAT Vertical;
 ```
 
@@ -3732,26 +3698,10 @@ Result:
 ```response
 Row 1:
 ──────
-val:             -1.111
-toTypeName(val): Nullable(Decimal(9, 5))
-```
-
-Query:
-
-``` sql
-SELECT
-    toDecimal32OrNull(toString(-1.111), 2) AS val,
-    toTypeName(val)
-FORMAT Vertical;
-```
-
-Result:
-
-```response
-Row 1:
-──────
-val:             -1.11
-toTypeName(val): Nullable(Decimal(9, 2))
+a:             -1.111
+toTypeName(a): Nullable(Decimal(9, 5))
+b:             ᴺᵁᴸᴸ
+toTypeName(b): Nullable(Decimal(9, 5))
 ```
 
 **See also**
@@ -3773,21 +3723,21 @@ toDecimal32OrDefault(expr, S[, default])
 **Arguments**
 
 - `expr` — A String representation of a number. [String](../data-types/string.md).
-- `S` — Scale parameter from [ 1 : 9 ] specifying how many decimal digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
-- `default` (optional) — The default value to return if parsing to type `Decimal32(S)` is unsuccessful. [Decimal32(S](../data-types/decimal.md).
+- `S` — Scale parameter between 0 and 9, specifying how many digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+- `default` (optional) — The default value to return if parsing to type `Decimal32(S)` is unsuccessful. [Decimal32(S)](../data-types/decimal.md).
 
 Supported arguments:
 - String representations of type (U)Int8/16/32/64/128/256.
 - String representations of type Float32/64.
 
 Unsupported arguments:
-- String representations of Float32/64 values `NaN` and `Inf` (case-insensitive).
+- String representations of Float32/64 values `NaN` and `Inf`.
 - String representations of binary and hexadecimal values, e.g. `SELECT toDecimal32OrDefault('0xc0fe', 1);`.
 
 :::note
-Integer overflow can occur if the value of `expr` exceeds the bounds of `Decimal32`: `( -1 * 10^(9 - S), 1 * 10^(9 - S) )`.
+An overflow can occur if the value of `expr` exceeds the bounds of `Decimal32`: `( -1 * 10^(9 - S), 1 * 10^(9 - S) )`.
 Excessive digits in a fraction are discarded (not rounded).
-Excessive digits in the integer part will lead to an exception.
+Excessive digits in the integer part will lead to an error.
 :::
 
 **Returned value**
@@ -3800,8 +3750,10 @@ Query:
 
 ``` sql
 SELECT
-    toDecimal32OrDefault(toString(-1.111), 5) AS val,
-    toTypeName(val)
+    toDecimal32OrDefault(toString(0.0001), 5) AS a,
+    toTypeName(a),
+    toDecimal32OrDefault('Inf', 0, CAST('-1', 'Decimal32(0)')) AS b,
+    toTypeName(b)
 FORMAT Vertical;
 ```
 
@@ -3810,16 +3762,125 @@ Result:
 ```response
 Row 1:
 ──────
-val:             -1.111
-toTypeName(val): Decimal(9, 5)
+a:             0.0001
+toTypeName(a): Decimal(9, 5)
+b:             -1
+toTypeName(b): Decimal(9, 0)
 ```
 
+**See also**
+
+- [`toDecimal32`](#todecimal32).
+- [`toDecimal32OrZero`](#todecimal32orzero).
+- [`toDecimal32OrNull`](#todecimal32ornull).
+
+## toDecimal64
+
+Converts an input value to a value of type [`Decimal(18, S)`](../data-types/decimal.md) with scale of `S`. Throws an exception in case of an error.
+
+**Syntax**
+
+```sql
+toDecimal64(expr, S)
+```
+
+**Arguments**
+
+- `expr` — Expression returning a number or a string representation of a number. [Expression](../syntax.md/#syntax-expressions).
+- `S` — Scale parameter between 0 and 18, specifying how many digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+
+Supported arguments:
+- Values or string representations of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type Float32/64.
+
+Unsupported arguments:
+- Values or string representations of Float32/64 values `NaN` and `Inf` (case-insensitive).
+- String representations of binary and hexadecimal values, e.g. `SELECT toDecimal64('0xc0fe', 1);`.
+
+:::note
+An overflow can occur if the value of `expr` exceeds the bounds of `Decimal64`: `( -1 * 10^(18 - S), 1 * 10^(18 - S) )`.
+Excessive digits in a fraction are discarded (not rounded).
+Excessive digits in the integer part will lead to an exception.
+:::
+
+**Returned value**
+
+- Value of type `Decimal(18, S)`. [Decimal64(S)](../data-types/decimal.md).
+
+**Example**
+
+Query:
+
+```sql
+SELECT
+    toDecimal64(2, 1) AS a, toTypeName(a) AS type_a,
+    toDecimal64(4.2, 2) AS b, toTypeName(b) AS type_b,
+    toDecimal64('4.2', 3) AS c, toTypeName(c) AS type_c
+FORMAT Vertical;
+```
+
+Result:
+
+```response
+Row 1:
+──────
+a:      2
+type_a: Decimal(18, 1)
+b:      4.2
+type_b: Decimal(18, 2)
+c:      4.2
+type_c: Decimal(18, 3)
+```
+
+**See also**
+
+- [`toDecimal64OrZero`](#todecimal64orzero).
+- [`toDecimal64OrNull`](#todecimal64ornull).
+- [`toDecimal64OrDefault`](#todecimal64ordefault).
+
+## toDecimal64OrZero
+
+Like [`toDecimal64`](#todecimal64), this function converts an input value to a value of type [Decimal(18, S)](../data-types/decimal.md) but returns `0` in case of an error.
+
+**Syntax**
+
+```sql
+toDecimal64OrZero(expr, S)
+```
+
+**Arguments**
+
+- `expr` — A String representation of a number. [String](../data-types/string.md).
+- `S` — Scale parameter between 0 and 18, specifying how many digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+
+Supported arguments:
+- String representations of type (U)Int8/16/32/64/128/256.
+- String representations of type Float32/64.
+
+Unsupported arguments:
+- String representations of Float32/64 values `NaN` and `Inf`.
+- String representations of binary and hexadecimal values, e.g. `SELECT toDecimal64OrZero('0xc0fe', 1);`.
+
+:::note
+An overflow can occur if the value of `expr` exceeds the bounds of `Decimal64`: `( -1 * 10^(18 - S), 1 * 10^(18 - S) )`.
+Excessive digits in a fraction are discarded (not rounded).
+Excessive digits in the integer part will lead to an error.
+:::
+
+**Returned value**
+
+- Value of type `Decimal(18, S)` if successful, otherwise `0` with `S` decimal places. [Decimal64(S)](../data-types/decimal.md).
+
+**Example**
+
 Query:
 
 ``` sql
 SELECT
-    toDecimal32OrDefault(toString(-1.111), 2) AS val,
-    toTypeName(val)
+    toDecimal64OrZero(toString(0.0001), 18) AS a,
+    toTypeName(a),
+    toDecimal64OrZero(toString('Inf'), 18) as b,
+    toTypeName(b)
 FORMAT Vertical;
 ```
 
@@ -3828,16 +3889,61 @@ Result:
 ```response
 Row 1:
 ──────
-val:             -1.11
-toTypeName(val): Decimal(9, 2)
+a:             0.0001
+toTypeName(a): Decimal(18, 18)
+b:             0
+toTypeName(b): Decimal(18, 18)
 ```
 
+**See also**
+
+- [`toDecimal64`](#todecimal64).
+- [`toDecimal64OrNull`](#todecimal64ornull).
+- [`toDecimal64OrDefault`](#todecimal64ordefault).
+
+## toDecimal64OrNull
+
+Like [`toDecimal64`](#todecimal64), this function converts an input value to a value of type [Nullable(Decimal(18, S))](../data-types/decimal.md) but returns `NULL` in case of an error.
+
+**Syntax**
+
+```sql
+toDecimal64OrNull(expr, S)
+```
+
+**Arguments**
+
+- `expr` — A String representation of a number. [String](../data-types/string.md).
+- `S` — Scale parameter between 0 and 18, specifying how many digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+
+Supported arguments:
+- String representations of type (U)Int8/16/32/64/128/256.
+- String representations of type Float32/64.
+
+Unsupported arguments:
+- String representations of Float32/64 values `NaN` and `Inf`.
+- String representations of binary and hexadecimal values, e.g. `SELECT toDecimal64OrNull('0xc0fe', 1);`.
+
+:::note
+An overflow can occur if the value of `expr` exceeds the bounds of `Decimal64`: `( -1 * 10^(18 - S), 1 * 10^(18 - S) )`.
+Excessive digits in a fraction are discarded (not rounded).
+Excessive digits in the integer part will lead to an error.
+:::
+
+**Returned value**
+
+- Value of type `Nullable(Decimal(18, S))` if successful, otherwise value `NULL` of the same type. [Decimal64(S)](../data-types/decimal.md).
+
+**Examples**
+
 Query:
 
 ``` sql
 SELECT
-    toDecimal32OrDefault('Inf', 2, CAST('0', 'Decimal32(2)')) AS val,
-    toTypeName(val)
+    toDecimal64OrNull(toString(0.0001), 18) AS a,
+    toTypeName(a),
+    toDecimal64OrNull(toString('Inf'), 18) as b,
+    toTypeName(b)
 FORMAT Vertical;
 ```
 
@@ -3846,10 +3952,590 @@ Result:
 ```response
 Row 1:
 ──────
-val:             0
-toTypeName(val): Decimal(9, 2)
+a:             0.0001
+toTypeName(a): Nullable(Decimal(18, 18))
+b:             ᴺᵁᴸᴸ
+toTypeName(b): Nullable(Decimal(18, 18))
 ```
 
+**See also**
+
+- [`toDecimal64`](#todecimal64).
+- [`toDecimal64OrZero`](#todecimal64orzero).
+- [`toDecimal64OrDefault`](#todecimal64ordefault).
+
+## toDecimal64OrDefault
+
+Like [`toDecimal64`](#todecimal64), this function converts an input value to a value of type [Decimal(18, S)](../data-types/decimal.md) but returns the default value in case of an error.
+
+**Syntax**
+
+```sql
+toDecimal64OrDefault(expr, S[, default])
+```
+
+**Arguments**
+
+- `expr` — A String representation of a number. [String](../data-types/string.md).
+- `S` — Scale parameter between 0 and 18, specifying how many digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+- `default` (optional) — The default value to return if parsing to type `Decimal64(S)` is unsuccessful. [Decimal64(S)](../data-types/decimal.md).
+
+Supported arguments:
+- String representations of type (U)Int8/16/32/64/128/256.
+- String representations of type Float32/64.
+
+Unsupported arguments:
+- String representations of Float32/64 values `NaN` and `Inf`.
+- String representations of binary and hexadecimal values, e.g. `SELECT toDecimal64OrDefault('0xc0fe', 1);`.
+
+:::note
+An overflow can occur if the value of `expr` exceeds the bounds of `Decimal64`: `( -1 * 10^(18 - S), 1 * 10^(18 - S) )`.
+Excessive digits in a fraction are discarded (not rounded).
+Excessive digits in the integer part will lead to an error.
+:::
+
+**Returned value**
+
+- Value of type `Decimal(18, S)` if successful, otherwise returns the default value if passed or `0` if not. [Decimal64(S)](../data-types/decimal.md).
+
+**Examples**
+
+Query:
+
+``` sql
+SELECT
+    toDecimal64OrDefault(toString(0.0001), 18) AS a,
+    toTypeName(a),
+    toDecimal64OrDefault('Inf', 0, CAST('-1', 'Decimal64(0)')) AS b,
+    toTypeName(b)
+FORMAT Vertical;
+```
+
+Result:
+
+```response
+Row 1:
+──────
+a:             0.0001
+toTypeName(a): Decimal(18, 18)
+b:             -1
+toTypeName(b): Decimal(18, 0)
+```
+
+**See also**
+
+- [`toDecimal64`](#todecimal64).
+- [`toDecimal64OrZero`](#todecimal64orzero).
+- [`toDecimal64OrNull`](#todecimal64ornull).
+
+## toDecimal128
+
+Converts an input value to a value of type [`Decimal(38, S)`](../data-types/decimal.md) with scale of `S`. Throws an exception in case of an error.
+
+**Syntax**
+
+```sql
+toDecimal128(expr, S)
+```
+
+**Arguments**
+
+- `expr` — Expression returning a number or a string representation of a number. [Expression](../syntax.md/#syntax-expressions).
+- `S` — Scale parameter between 0 and 38, specifying how many digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+
+Supported arguments:
+- Values or string representations of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type Float32/64.
+
+Unsupported arguments:
+- Values or string representations of Float32/64 values `NaN` and `Inf` (case-insensitive).
+- String representations of binary and hexadecimal values, e.g. `SELECT toDecimal128('0xc0fe', 1);`.
+
+:::note
+An overflow can occur if the value of `expr` exceeds the bounds of `Decimal128`: `( -1 * 10^(38 - S), 1 * 10^(38 - S) )`.
+Excessive digits in a fraction are discarded (not rounded).
+Excessive digits in the integer part will lead to an exception.
+:::
+
+**Returned value**
+
+- Value of type `Decimal(38, S)`. [Decimal128(S)](../data-types/decimal.md).
+
+**Example**
+
+Query:
+
+```sql
+SELECT
+    toDecimal128(99, 1) AS a, toTypeName(a) AS type_a,
+    toDecimal128(99.67, 2) AS b, toTypeName(b) AS type_b,
+    toDecimal128('99.67', 3) AS c, toTypeName(c) AS type_c
+FORMAT Vertical;
+```
+
+Result:
+
+```response
+Row 1:
+──────
+a:      99
+type_a: Decimal(38, 1)
+b:      99.67
+type_b: Decimal(38, 2)
+c:      99.67
+type_c: Decimal(38, 3)
+```
+
+**See also**
+
+- [`toDecimal128OrZero`](#todecimal128orzero).
+- [`toDecimal128OrNull`](#todecimal128ornull).
+- [`toDecimal128OrDefault`](#todecimal128ordefault).
+
+## toDecimal128OrZero
+
+Like [`toDecimal128`](#todecimal128), this function converts an input value to a value of type [Decimal(38, S)](../data-types/decimal.md) but returns `0` in case of an error.
+
+**Syntax**
+
+```sql
+toDecimal128OrZero(expr, S)
+```
+
+**Arguments**
+
+- `expr` — A String representation of a number. [String](../data-types/string.md).
+- `S` — Scale parameter between 0 and 38, specifying how many digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+
+Supported arguments:
+- String representations of type (U)Int8/16/32/64/128/256.
+- String representations of type Float32/64.
+
+Unsupported arguments:
+- String representations of Float32/64 values `NaN` and `Inf`.
+- String representations of binary and hexadecimal values, e.g. `SELECT toDecimal128OrZero('0xc0fe', 1);`.
+
+:::note
+An overflow can occur if the value of `expr` exceeds the bounds of `Decimal128`: `( -1 * 10^(38 - S), 1 * 10^(38 - S) )`.
+Excessive digits in a fraction are discarded (not rounded).
+Excessive digits in the integer part will lead to an error.
+:::
+
+**Returned value**
+
+- Value of type `Decimal(38, S)` if successful, otherwise `0` with `S` decimal places. [Decimal128(S)](../data-types/decimal.md).
+
+**Example**
+
+Query:
+
+``` sql
+SELECT
+    toDecimal128OrZero(toString(0.0001), 38) AS a,
+    toTypeName(a),
+    toDecimal128OrZero(toString('Inf'), 38) as b,
+    toTypeName(b)
+FORMAT Vertical;
+```
+
+Result:
+
+```response
+Row 1:
+──────
+a:             0.0001
+toTypeName(a): Decimal(38, 38)
+b:             0
+toTypeName(b): Decimal(38, 38)
+```
+
+**See also**
+
+- [`toDecimal128`](#todecimal128).
+- [`toDecimal128OrNull`](#todecimal128ornull).
+- [`toDecimal128OrDefault`](#todecimal128ordefault).
+
+## toDecimal128OrNull
+
+Like [`toDecimal128`](#todecimal128), this function converts an input value to a value of type [Nullable(Decimal(38, S))](../data-types/decimal.md) but returns `NULL` in case of an error.
+
+**Syntax**
+
+```sql
+toDecimal128OrNull(expr, S)
+```
+
+**Arguments**
+
+- `expr` — A String representation of a number. [String](../data-types/string.md).
+- `S` — Scale parameter between 0 and 38, specifying how many digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+
+Supported arguments:
+- String representations of type (U)Int8/16/32/64/128/256.
+- String representations of type Float32/64.
+
+Unsupported arguments:
+- String representations of Float32/64 values `NaN` and `Inf`.
+- String representations of binary and hexadecimal values, e.g. `SELECT toDecimal128OrNull('0xc0fe', 1);`.
+
+:::note
+An overflow can occur if the value of `expr` exceeds the bounds of `Decimal128`: `( -1 * 10^(38 - S), 1 * 10^(38 - S) )`.
+Excessive digits in a fraction are discarded (not rounded).
+Excessive digits in the integer part will lead to an error.
+:::
+
+**Returned value**
+
+- Value of type `Nullable(Decimal(38, S))` if successful, otherwise value `NULL` of the same type. [Decimal128(S)](../data-types/decimal.md).
+
+**Examples**
+
+Query:
+
+``` sql
+SELECT
+    toDecimal128OrNull(toString(1/42), 38) AS a,
+    toTypeName(a),
+    toDecimal128OrNull(toString('Inf'), 38) as b,
+    toTypeName(b)
+FORMAT Vertical;
+```
+
+Result:
+
+```response
+Row 1:
+──────
+a:             0.023809523809523808
+toTypeName(a): Nullable(Decimal(38, 38))
+b:             ᴺᵁᴸᴸ
+toTypeName(b): Nullable(Decimal(38, 38))
+```
+
+**See also**
+
+- [`toDecimal128`](#todecimal128).
+- [`toDecimal128OrZero`](#todecimal128orzero).
+- [`toDecimal128OrDefault`](#todecimal128ordefault).
+
+## toDecimal128OrDefault
+
+Like [`toDecimal128`](#todecimal128), this function converts an input value to a value of type [Decimal(38, S)](../data-types/decimal.md) but returns the default value in case of an error.
+
+**Syntax**
+
+```sql
+toDecimal128OrDefault(expr, S[, default])
+```
+
+**Arguments**
+
+- `expr` — A String representation of a number. [String](../data-types/string.md).
+- `S` — Scale parameter between 0 and 38, specifying how many digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+- `default` (optional) — The default value to return if parsing to type `Decimal128(S)` is unsuccessful. [Decimal128(S)](../data-types/decimal.md).
+
+Supported arguments:
+- String representations of type (U)Int8/16/32/64/128/256.
+- String representations of type Float32/64.
+
+Unsupported arguments:
+- String representations of Float32/64 values `NaN` and `Inf`.
+- String representations of binary and hexadecimal values, e.g. `SELECT toDecimal128OrDefault('0xc0fe', 1);`.
+
+:::note
+An overflow can occur if the value of `expr` exceeds the bounds of `Decimal128`: `( -1 * 10^(38 - S), 1 * 10^(38 - S) )`.
+Excessive digits in a fraction are discarded (not rounded).
+Excessive digits in the integer part will lead to an error.
+:::
+
+**Returned value**
+
+- Value of type `Decimal(38, S)` if successful, otherwise returns the default value if passed or `0` if not. [Decimal128(S)](../data-types/decimal.md).
+
+**Examples**
+
+Query:
+
+``` sql
+SELECT
+    toDecimal128OrDefault(toString(1/42), 18) AS a,
+    toTypeName(a),
+    toDecimal128OrDefault('Inf', 0, CAST('-1', 'Decimal128(0)')) AS b,
+    toTypeName(b)
+FORMAT Vertical;
+```
+
+Result:
+
+```response
+Row 1:
+──────
+a:             0.023809523809523808
+toTypeName(a): Decimal(38, 18)
+b:             -1
+toTypeName(b): Decimal(38, 0)
+```
+
+**See also**
+
+- [`toDecimal128`](#todecimal128).
+- [`toDecimal128OrZero`](#todecimal128orzero).
+- [`toDecimal128OrNull`](#todecimal128ornull).
+
+## toDecimal256
+
+Converts an input value to a value of type [`Decimal(76, S)`](../data-types/decimal.md) with scale of `S`. Throws an exception in case of an error.
+
+**Syntax**
+
+```sql
+toDecimal256(expr, S)
+```
+
+**Arguments**
+
+- `expr` — Expression returning a number or a string representation of a number. [Expression](../syntax.md/#syntax-expressions).
+- `S` — Scale parameter between 0 and 76, specifying how many digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+
+Supported arguments:
+- Values or string representations of type (U)Int8/16/32/64/128/256.
+- Values or string representations of type Float32/64.
+
+Unsupported arguments:
+- Values or string representations of Float32/64 values `NaN` and `Inf` (case-insensitive).
+- String representations of binary and hexadecimal values, e.g. `SELECT toDecimal256('0xc0fe', 1);`.
+
+:::note
+An overflow can occur if the value of `expr` exceeds the bounds of `Decimal256`: `( -1 * 10^(76 - S), 1 * 10^(76 - S) )`.
+Excessive digits in a fraction are discarded (not rounded).
+Excessive digits in the integer part will lead to an exception.
+:::
+
+**Returned value**
+
+- Value of type `Decimal(76, S)`. [Decimal256(S)](../data-types/decimal.md).
+
+**Example**
+
+Query:
+
+```sql
+SELECT
+    toDecimal256(99, 1) AS a, toTypeName(a) AS type_a,
+    toDecimal256(99.67, 2) AS b, toTypeName(b) AS type_b,
+    toDecimal256('99.67', 3) AS c, toTypeName(c) AS type_c
+FORMAT Vertical;
+```
+
+Result:
+
+```response
+Row 1:
+──────
+a:      99
+type_a: Decimal(76, 1)
+b:      99.67
+type_b: Decimal(76, 2)
+c:      99.67
+type_c: Decimal(76, 3)
+```
+
+**See also**
+
+- [`toDecimal256OrZero`](#todecimal256orzero).
+- [`toDecimal256OrNull`](#todecimal256ornull).
+- [`toDecimal256OrDefault`](#todecimal256ordefault).
+
+## toDecimal256OrZero
+
+Like [`toDecimal256`](#todecimal256), this function converts an input value to a value of type [Decimal(76, S)](../data-types/decimal.md) but returns `0` in case of an error.
+
+**Syntax**
+
+```sql
+toDecimal256OrZero(expr, S)
+```
+
+**Arguments**
+
+- `expr` — A String representation of a number. [String](../data-types/string.md).
+- `S` — Scale parameter between 0 and 76, specifying how many digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+
+Supported arguments:
+- String representations of type (U)Int8/16/32/64/128/256.
+- String representations of type Float32/64.
+
+Unsupported arguments:
+- String representations of Float32/64 values `NaN` and `Inf`.
+- String representations of binary and hexadecimal values, e.g. `SELECT toDecimal256OrZero('0xc0fe', 1);`.
+
+:::note
+An overflow can occur if the value of `expr` exceeds the bounds of `Decimal256`: `( -1 * 10^(76 - S), 1 * 10^(76 - S) )`.
+Excessive digits in a fraction are discarded (not rounded).
+Excessive digits in the integer part will lead to an error.
+:::
+
+**Returned value**
+
+- Value of type `Decimal(76, S)` if successful, otherwise `0` with `S` decimal places. [Decimal256(S)](../data-types/decimal.md).
+
+**Example**
+
+Query:
+
+``` sql
+SELECT
+    toDecimal256OrZero(toString(0.0001), 76) AS a,
+    toTypeName(a),
+    toDecimal256OrZero(toString('Inf'), 76) as b,
+    toTypeName(b)
+FORMAT Vertical;
+```
+
+Result:
+
+```response
+Row 1:
+──────
+a:             0.0001
+toTypeName(a): Decimal(76, 76)
+b:             0
+toTypeName(b): Decimal(76, 76)
+```
+
+**See also**
+
+- [`toDecimal256`](#todecimal256).
+- [`toDecimal256OrNull`](#todecimal256ornull).
+- [`toDecimal256OrDefault`](#todecimal256ordefault).
+
+## toDecimal256OrNull
+
+Like [`toDecimal256`](#todecimal256), this function converts an input value to a value of type [Nullable(Decimal(76, S))](../data-types/decimal.md) but returns `NULL` in case of an error.
+
+**Syntax**
+
+```sql
+toDecimal256OrNull(expr, S)
+```
+
+**Arguments**
+
+- `expr` — A String representation of a number. [String](../data-types/string.md).
+- `S` — Scale parameter between 0 and 76, specifying how many digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+
+Supported arguments:
+- String representations of type (U)Int8/16/32/64/128/256.
+- String representations of type Float32/64.
+
+Unsupported arguments:
+- String representations of Float32/64 values `NaN` and `Inf`.
+- String representations of binary and hexadecimal values, e.g. `SELECT toDecimal256OrNull('0xc0fe', 1);`.
+
+:::note
+An overflow can occur if the value of `expr` exceeds the bounds of `Decimal256`: `( -1 * 10^(76 - S), 1 * 10^(76 - S) )`.
+Excessive digits in a fraction are discarded (not rounded).
+Excessive digits in the integer part will lead to an error.
+:::
+
+**Returned value**
+
+- Value of type `Nullable(Decimal(76, S))` if successful, otherwise value `NULL` of the same type. [Decimal256(S)](../data-types/decimal.md).
+
+**Examples**
+
+Query:
+
+``` sql
+SELECT
+    toDecimal256OrNull(toString(1/42), 76) AS a,
+    toTypeName(a),
+    toDecimal256OrNull(toString('Inf'), 76) as b,
+    toTypeName(b)
+FORMAT Vertical;
+```
+
+Result:
+
+```response
+Row 1:
+──────
+a:             0.023809523809523808
+toTypeName(a): Nullable(Decimal(76, 76))
+b:             ᴺᵁᴸᴸ
+toTypeName(b): Nullable(Decimal(76, 76))
+```
+
+**See also**
+
+- [`toDecimal256`](#todecimal256).
+- [`toDecimal256OrZero`](#todecimal256orzero).
+- [`toDecimal256OrDefault`](#todecimal256ordefault).
+
+## toDecimal256OrDefault
+
+Like [`toDecimal256`](#todecimal256), this function converts an input value to a value of type [Decimal(76, S)](../data-types/decimal.md) but returns the default value in case of an error.
+
+**Syntax**
+
+```sql
+toDecimal256OrDefault(expr, S[, default])
+```
+
+**Arguments**
+
+- `expr` — A String representation of a number. [String](../data-types/string.md).
+- `S` — Scale parameter between 0 and 76, specifying how many digits the fractional part of a number can have. [UInt8](../data-types/int-uint.md).
+- `default` (optional) — The default value to return if parsing to type `Decimal256(S)` is unsuccessful. [Decimal256(S)](../data-types/decimal.md).
+
+Supported arguments:
+- String representations of type (U)Int8/16/32/64/128/256.
+- String representations of type Float32/64.
+
+Unsupported arguments:
+- String representations of Float32/64 values `NaN` and `Inf`.
+- String representations of binary and hexadecimal values, e.g. `SELECT toDecimal256OrDefault('0xc0fe', 1);`.
+
+:::note
+An overflow can occur if the value of `expr` exceeds the bounds of `Decimal256`: `( -1 * 10^(76 - S), 1 * 10^(76 - S) )`.
+Excessive digits in a fraction are discarded (not rounded).
+Excessive digits in the integer part will lead to an error.
+:::
+
+**Returned value**
+
+- Value of type `Decimal(76, S)` if successful, otherwise returns the default value if passed or `0` if not. [Decimal256(S)](../data-types/decimal.md).
+
+**Examples**
+
+Query:
+
+``` sql
+SELECT
+    toDecimal256OrDefault(toString(1/42), 76) AS a,
+    toTypeName(a),
+    toDecimal256OrDefault('Inf', 0, CAST('-1', 'Decimal256(0)')) AS b,
+    toTypeName(b)
+FORMAT Vertical;
+```
+
+Result:
+
+```response
+Row 1:
+──────
+a:             0.023809523809523808
+toTypeName(a): Decimal(76, 76)
+b:             -1
+toTypeName(b): Decimal(76, 0)
+```
+
+**See also**
+
+- [`toDecimal256`](#todecimal256).
+- [`toDecimal256OrZero`](#todecimal256orzero).
+- [`toDecimal256OrNull`](#todecimal256ornull).
+
 ## toString
 
 Functions for converting between numbers, strings (but not fixed strings), dates, and dates with times.

From 18d9bb2ade4e98051df007663a387eb74146c26f Mon Sep 17 00:00:00 2001
From: Azat Khuzhin <a3at.mail@gmail.com>
Date: Sat, 10 Aug 2024 16:25:32 +0200
Subject: [PATCH 45/52] tests: attempt to fix 01600_parts_states_metrics_long
 (by forbid parallel run)

CI: https://s3.amazonaws.com/clickhouse-test-reports/68134/8d4f822fee64d44440459b733c67dee5e9fb1e02/stateless_tests__tsan__s3_storage__[2_4].html
Signed-off-by: Azat Khuzhin <a.khuzhin@semrush.com>
---
 tests/queries/0_stateless/01600_parts_states_metrics_long.sh | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/queries/0_stateless/01600_parts_states_metrics_long.sh b/tests/queries/0_stateless/01600_parts_states_metrics_long.sh
index 47b5a4dea13..8062bb0ba5d 100755
--- a/tests/queries/0_stateless/01600_parts_states_metrics_long.sh
+++ b/tests/queries/0_stateless/01600_parts_states_metrics_long.sh
@@ -1,5 +1,5 @@
 #!/usr/bin/env bash
-# Tags: long
+# Tags: long, no-parallel
 
 CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)
 # shellcheck source=../shell_config.sh

From eeda67042c08bedbd18c3b7a76cb8928e9975348 Mon Sep 17 00:00:00 2001
From: Azat Khuzhin <a3at.mail@gmail.com>
Date: Sat, 10 Aug 2024 16:28:49 +0200
Subject: [PATCH 46/52] tests: make 01600_parts_states_metrics_long faster

Signed-off-by: Azat Khuzhin <a.khuzhin@semrush.com>
---
 .../01600_parts_states_metrics_long.sh        | 22 ++++++++++++-------
 1 file changed, 14 insertions(+), 8 deletions(-)

diff --git a/tests/queries/0_stateless/01600_parts_states_metrics_long.sh b/tests/queries/0_stateless/01600_parts_states_metrics_long.sh
index 8062bb0ba5d..a07dd306b3e 100755
--- a/tests/queries/0_stateless/01600_parts_states_metrics_long.sh
+++ b/tests/queries/0_stateless/01600_parts_states_metrics_long.sh
@@ -5,6 +5,12 @@ CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)
 # shellcheck source=../shell_config.sh
 . "$CURDIR"/../shell_config.sh
 
+function query()
+{
+    # NOTE: database_atomic_wait_for_drop_and_detach_synchronously needed only for local env, CI has it ON
+    ${CLICKHOUSE_CURL} -sS "${CLICKHOUSE_URL}&database_atomic_wait_for_drop_and_detach_synchronously=1" -d "$*"
+}
+
 # NOTE: database = $CLICKHOUSE_DATABASE is unwanted
 verify_sql="SELECT
     (SELECT sumIf(value, metric = 'PartsActive'), sumIf(value, metric = 'PartsOutdated') FROM system.metrics)
@@ -18,13 +24,13 @@ verify()
 {
     for i in {1..5000}
     do
-        result=$( $CLICKHOUSE_CLIENT --query="$verify_sql" )
+        result=$( query "$verify_sql" )
         [ "$result" = "1" ] && echo "$result" && break
         sleep 0.1
 
         if [[ $i -eq 5000 ]]
         then
-            $CLICKHOUSE_CLIENT "
+            query "
               SELECT sumIf(value, metric = 'PartsActive'), sumIf(value, metric = 'PartsOutdated') FROM system.metrics;
               SELECT sum(active), sum(NOT active) FROM system.parts;
               SELECT sum(active), sum(NOT active) FROM system.projection_parts;
@@ -34,17 +40,17 @@ verify()
     done
 }
 
-$CLICKHOUSE_CLIENT --database_atomic_wait_for_drop_and_detach_synchronously=1 --query="DROP TABLE IF EXISTS test_table"
-$CLICKHOUSE_CLIENT --query="CREATE TABLE test_table (data Date) ENGINE = MergeTree PARTITION BY toYear(data) ORDER BY data;"
+query "DROP TABLE IF EXISTS test_table"
+query "CREATE TABLE test_table (data Date) ENGINE = MergeTree PARTITION BY toYear(data) ORDER BY data;"
 
-$CLICKHOUSE_CLIENT --query="INSERT INTO test_table VALUES ('1992-01-01')"
+query "INSERT INTO test_table VALUES ('1992-01-01')"
 verify
 
-$CLICKHOUSE_CLIENT --query="INSERT INTO test_table VALUES ('1992-01-02')"
+query "INSERT INTO test_table VALUES ('1992-01-02')"
 verify
 
-$CLICKHOUSE_CLIENT --query="OPTIMIZE TABLE test_table FINAL"
+query "OPTIMIZE TABLE test_table FINAL"
 verify
 
-$CLICKHOUSE_CLIENT --database_atomic_wait_for_drop_and_detach_synchronously=1 --query="DROP TABLE test_table"
+query "DROP TABLE test_table"
 verify

From 613ebe367c1f811eea38d7c5e778cedddbfb0ce7 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?J=C3=A1nos=20Benjamin=20Antal?=
 <benjamin.antal@clickhouse.com>
Date: Sat, 10 Aug 2024 22:05:11 +0000
Subject: [PATCH 47/52] Only add extra cell when necessary

---
 tests/ci/report.py | 14 +++++++-------
 1 file changed, 7 insertions(+), 7 deletions(-)

diff --git a/tests/ci/report.py b/tests/ci/report.py
index 15b1512896a..6779a6dae96 100644
--- a/tests/ci/report.py
+++ b/tests/ci/report.py
@@ -738,7 +738,7 @@ def create_test_html_report(
     if test_results:
         rows_part = []
         num_fails = 0
-        has_test_time = False
+        has_test_time = any(tr.time is not None for tr in test_results)
         has_log_urls = False
 
         # Display entires with logs at the top (they correspond to failed tests)
@@ -770,12 +770,12 @@ def create_test_html_report(
             row.append(f'<td {fail_id}style="{style}">{test_result.status}</td>')
             colspan += 1
 
-            row.append("<td>")
-            if test_result.time is not None:
-                has_test_time = True
-                row.append(str(test_result.time))
-            row.append("</td>")
-            colspan += 1
+            if has_test_time:
+                if test_result.time is not None:
+                    row.append(f"<td>{test_result.time}</td>")
+                else:
+                    row.append("<td></td>")
+                colspan += 1
 
             if test_result.log_urls is not None:
                 has_log_urls = True

From 1142305b113e261d0c8910c0b622ba94727fe78d Mon Sep 17 00:00:00 2001
From: Azat Khuzhin <a3at.mail@gmail.com>
Date: Sat, 10 Aug 2024 09:53:43 +0200
Subject: [PATCH 48/52] tests: fix 01246_buffer_flush flakiness due to slow
 trace_log flush

Signed-off-by: Azat Khuzhin <a.khuzhin@semrush.com>
---
 tests/queries/0_stateless/01246_buffer_flush.sh | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/queries/0_stateless/01246_buffer_flush.sh b/tests/queries/0_stateless/01246_buffer_flush.sh
index aea91a0bf6b..3c7b9038e1f 100755
--- a/tests/queries/0_stateless/01246_buffer_flush.sh
+++ b/tests/queries/0_stateless/01246_buffer_flush.sh
@@ -27,7 +27,7 @@ function wait_until()
 function get_buffer_delay()
 {
     local buffer_insert_id=$1 && shift
-    query "SYSTEM FLUSH LOGS"
+    $CLICKHOUSE_CLIENT -q "SYSTEM FLUSH LOGS"
     query "
         WITH
             (SELECT event_time_microseconds FROM system.query_log WHERE current_database = '$CLICKHOUSE_DATABASE' AND type = 'QueryStart' AND query_id = '$buffer_insert_id') AS begin_,

From 53bc1b7e3539cde14cb34f26af296bde5c29449e Mon Sep 17 00:00:00 2001
From: Alexander Tokmakov <tavplubix@gmail.com>
Date: Sun, 11 Aug 2024 13:19:36 +0200
Subject: [PATCH 49/52] Revert "Refactor tests for (experimental) statistics"

---
 docs/en/development/tests.md                  |   4 +-
 .../statements/alter/statistics.md            |  16 +-
 src/Storages/MergeTree/MergeTreeData.cpp      |   2 +-
 ...2864_statistics_count_min_sketch.reference |  14 ++
 .../02864_statistics_count_min_sketch.sql     |  70 ++++++
 .../02864_statistics_ddl.reference            |  37 ++-
 .../0_stateless/02864_statistics_ddl.sql      | 234 ++++--------------
 ...delayed_materialization_in_merge.reference |  12 -
 ...stics_delayed_materialization_in_merge.sql |  36 ---
 .../02864_statistics_exception.reference      |   0
 .../02864_statistics_exception.sql            |  55 ++++
 ..._statistics_materialize_in_merge.reference |  10 +
 .../02864_statistics_materialize_in_merge.sql |  52 ++++
 .../02864_statistics_predicates.reference     |  98 --------
 .../02864_statistics_predicates.sql           | 214 ----------------
 .../02864_statistics_uniq.reference           |  35 +++
 .../0_stateless/02864_statistics_uniq.sql     |  73 ++++++
 .../02864_statistics_usage.reference          |  20 --
 .../0_stateless/02864_statistics_usage.sql    |  42 ----
 19 files changed, 399 insertions(+), 625 deletions(-)
 create mode 100644 tests/queries/0_stateless/02864_statistics_count_min_sketch.reference
 create mode 100644 tests/queries/0_stateless/02864_statistics_count_min_sketch.sql
 delete mode 100644 tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.reference
 delete mode 100644 tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.sql
 create mode 100644 tests/queries/0_stateless/02864_statistics_exception.reference
 create mode 100644 tests/queries/0_stateless/02864_statistics_exception.sql
 create mode 100644 tests/queries/0_stateless/02864_statistics_materialize_in_merge.reference
 create mode 100644 tests/queries/0_stateless/02864_statistics_materialize_in_merge.sql
 delete mode 100644 tests/queries/0_stateless/02864_statistics_predicates.reference
 delete mode 100644 tests/queries/0_stateless/02864_statistics_predicates.sql
 create mode 100644 tests/queries/0_stateless/02864_statistics_uniq.reference
 create mode 100644 tests/queries/0_stateless/02864_statistics_uniq.sql
 delete mode 100644 tests/queries/0_stateless/02864_statistics_usage.reference
 delete mode 100644 tests/queries/0_stateless/02864_statistics_usage.sql

diff --git a/docs/en/development/tests.md b/docs/en/development/tests.md
index 6cb36e2049b..269995a1a96 100644
--- a/docs/en/development/tests.md
+++ b/docs/en/development/tests.md
@@ -14,7 +14,7 @@ Each functional test sends one or multiple queries to the running ClickHouse ser
 
 Tests are located in `queries` directory. There are two subdirectories: `stateless` and `stateful`. Stateless tests run queries without any preloaded test data - they often create small synthetic datasets on the fly, within the test itself. Stateful tests require preloaded test data from ClickHouse and it is available to general public.
 
-Each test can be one of two types: `.sql` and `.sh`. `.sql` test is the simple SQL script that is piped to `clickhouse-client`. `.sh` test is a script that is run by itself. SQL tests are generally preferable to `.sh` tests. You should use `.sh` tests only when you have to test some feature that cannot be exercised from pure SQL, such as piping some input data into `clickhouse-client` or testing `clickhouse-local`.
+Each test can be one of two types: `.sql` and `.sh`. `.sql` test is the simple SQL script that is piped to `clickhouse-client --multiquery`. `.sh` test is a script that is run by itself. SQL tests are generally preferable to `.sh` tests. You should use `.sh` tests only when you have to test some feature that cannot be exercised from pure SQL, such as piping some input data into `clickhouse-client` or testing `clickhouse-local`.
 
 :::note
 A common mistake when testing data types `DateTime` and `DateTime64` is assuming that the server uses a specific time zone (e.g. "UTC"). This is not the case, time zones in CI test runs
@@ -38,7 +38,7 @@ For more options, see `tests/clickhouse-test --help`. You can simply run all tes
 
 ### Adding a New Test
 
-To add new test, create a `.sql` or `.sh` file in `queries/0_stateless` directory, check it manually and then generate `.reference` file in the following way: `clickhouse-client < 00000_test.sql > 00000_test.reference` or `./00000_test.sh > ./00000_test.reference`.
+To add new test, create a `.sql` or `.sh` file in `queries/0_stateless` directory, check it manually and then generate `.reference` file in the following way: `clickhouse-client --multiquery < 00000_test.sql > 00000_test.reference` or `./00000_test.sh > ./00000_test.reference`.
 
 Tests should use (create, drop, etc) only tables in `test` database that is assumed to be created beforehand; also tests can use temporary tables.
 
diff --git a/docs/en/sql-reference/statements/alter/statistics.md b/docs/en/sql-reference/statements/alter/statistics.md
index 7a1774a01b5..6880cef0e5c 100644
--- a/docs/en/sql-reference/statements/alter/statistics.md
+++ b/docs/en/sql-reference/statements/alter/statistics.md
@@ -8,28 +8,26 @@ sidebar_label: STATISTICS
 
 The following operations are available:
 
--   `ALTER TABLE [db].table ADD STATISTICS [IF NOT EXISTS] (column list) TYPE (type list)` - Adds statistic description to tables metadata.
+-   `ALTER TABLE [db].table ADD STATISTICS (columns list) TYPE (type list)` - Adds statistic description to tables metadata.
 
--   `ALTER TABLE [db].table MODIFY STATISTICS (column list) TYPE (type list)` - Modifies statistic description to tables metadata.
+-   `ALTER TABLE [db].table MODIFY STATISTICS (columns list) TYPE (type list)` - Modifies statistic description to tables metadata.
 
--   `ALTER TABLE [db].table DROP STATISTICS [IF EXISTS] (column list)` - Removes statistics from the metadata of the specified columns and deletes all statistics objects in all parts for the specified columns.
+-   `ALTER TABLE [db].table DROP STATISTICS (columns list)` - Removes statistics from the metadata of the specified columns and deletes all statistics objects in all parts for the specified columns.
 
--   `ALTER TABLE [db].table CLEAR STATISTICS [IF EXISTS] (column list)` - Deletes all statistics objects in all parts for the specified columns. Statistics objects can be rebuild using `ALTER TABLE MATERIALIZE STATISTICS`.
+-   `ALTER TABLE [db].table CLEAR STATISTICS (columns list)` - Deletes all statistics objects in all parts for the specified columns. Statistics objects can be rebuild using `ALTER TABLE MATERIALIZE STATISTICS`.
 
--   `ALTER TABLE [db.]table MATERIALIZE STATISTICS [IF EXISTS] (column list)` - Rebuilds the statistic for columns. Implemented as a [mutation](../../../sql-reference/statements/alter/index.md#mutations). 
+-   `ALTER TABLE [db.]table MATERIALIZE STATISTICS (columns list)` - Rebuilds the statistic for columns. Implemented as a [mutation](../../../sql-reference/statements/alter/index.md#mutations). 
 
 The first two commands are lightweight in a sense that they only change metadata or remove files.
 
 Also, they are replicated, syncing statistics metadata via ZooKeeper.
 
-## Example:
-
-Adding two statistics types to two columns:
+There is an example adding two statistics types to two columns:
 
 ```
 ALTER TABLE t1 MODIFY STATISTICS c, d TYPE TDigest, Uniq;
 ```
 
 :::note
-Statistic are supported only for [`*MergeTree`](../../../engines/table-engines/mergetree-family/mergetree.md) engine tables (including [replicated](../../../engines/table-engines/mergetree-family/replication.md) variants).
+Statistic manipulation is supported only for tables with [`*MergeTree`](../../../engines/table-engines/mergetree-family/mergetree.md) engine (including [replicated](../../../engines/table-engines/mergetree-family/replication.md) variants).
 :::
diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp
index c7101021f02..625b1281c61 100644
--- a/src/Storages/MergeTree/MergeTreeData.cpp
+++ b/src/Storages/MergeTree/MergeTreeData.cpp
@@ -3517,7 +3517,7 @@ void MergeTreeData::checkAlterIsPossible(const AlterCommands & commands, Context
                         const auto & new_column = new_metadata.getColumns().get(command.column_name);
                         if (!old_column.type->equals(*new_column.type))
                             throw Exception(ErrorCodes::ALTER_OF_COLUMN_IS_FORBIDDEN,
-                                            "ALTER types of column {} with statistics is not safe "
+                                            "ALTER types of column {} with statistics is not safe "
                                             "because it can change the representation of statistics",
                                             backQuoteIfNeed(command.column_name));
                     }
diff --git a/tests/queries/0_stateless/02864_statistics_count_min_sketch.reference b/tests/queries/0_stateless/02864_statistics_count_min_sketch.reference
new file mode 100644
index 00000000000..02c41656a36
--- /dev/null
+++ b/tests/queries/0_stateless/02864_statistics_count_min_sketch.reference
@@ -0,0 +1,14 @@
+CREATE TABLE default.tab\n(\n    `a` String,\n    `b` UInt64,\n    `c` Int64,\n    `pk` String\n)\nENGINE = MergeTree\nORDER BY pk\nSETTINGS min_bytes_for_wide_part = 0, index_granularity = 8192
+Test statistics count_min:
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(equals(a, \'0\'), equals(b, 0), equals(c, 0)) (removed)
+Test statistics multi-types:
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(equals(a, \'0\'), less(c, -90), greater(b, 900)) (removed)
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(equals(a, \'10000\'), equals(b, 0), less(c, 0)) (removed)
+Test LowCardinality and Nullable data type:
+tab2
diff --git a/tests/queries/0_stateless/02864_statistics_count_min_sketch.sql b/tests/queries/0_stateless/02864_statistics_count_min_sketch.sql
new file mode 100644
index 00000000000..c730aa7b4a7
--- /dev/null
+++ b/tests/queries/0_stateless/02864_statistics_count_min_sketch.sql
@@ -0,0 +1,70 @@
+-- Tags: no-fasttest
+
+DROP TABLE IF EXISTS tab SYNC;
+
+SET allow_experimental_statistics = 1;
+SET allow_statistics_optimize = 1;
+SET allow_suspicious_low_cardinality_types=1;
+SET mutations_sync = 2;
+
+CREATE TABLE tab
+(
+    a String,
+    b UInt64,
+    c Int64,
+    pk String,
+) Engine = MergeTree() ORDER BY pk
+SETTINGS min_bytes_for_wide_part = 0;
+
+SHOW CREATE TABLE tab;
+
+INSERT INTO tab select toString(number % 10000), number % 1000, -(number % 100), generateUUIDv4() FROM system.numbers LIMIT 10000;
+
+SELECT 'Test statistics count_min:';
+
+ALTER TABLE tab ADD STATISTICS a TYPE count_min;
+ALTER TABLE tab ADD STATISTICS b TYPE count_min;
+ALTER TABLE tab ADD STATISTICS c TYPE count_min;
+ALTER TABLE tab MATERIALIZE STATISTICS a, b, c;
+
+SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8|_UInt16|_String', '')
+FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE c = 0/*100*/ and b = 0/*10*/ and a = '0'/*1*/) xx
+WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+
+ALTER TABLE tab DROP STATISTICS a, b, c;
+
+
+SELECT 'Test statistics multi-types:';
+
+ALTER TABLE tab ADD STATISTICS a TYPE count_min;
+ALTER TABLE tab ADD STATISTICS b TYPE count_min, uniq, tdigest;
+ALTER TABLE tab ADD STATISTICS c TYPE count_min, uniq, tdigest;
+ALTER TABLE tab MATERIALIZE STATISTICS a, b, c;
+
+SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8|_UInt16|_String', '')
+FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE c < -90/*900*/ and b > 900/*990*/ and a = '0'/*1*/)
+WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+
+SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8|_UInt16|_String', '')
+FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE c < 0/*9900*/ and b = 0/*10*/ and a = '10000'/*0*/)
+WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+
+ALTER TABLE tab DROP STATISTICS a, b, c;
+
+DROP TABLE IF EXISTS tab SYNC;
+
+
+SELECT 'Test LowCardinality and Nullable data type:';
+DROP TABLE IF EXISTS tab2 SYNC;
+SET allow_suspicious_low_cardinality_types=1;
+CREATE TABLE tab2
+(
+    a LowCardinality(Int64) STATISTICS(count_min),
+    b Nullable(Int64) STATISTICS(count_min),
+    c LowCardinality(Nullable(Int64)) STATISTICS(count_min),
+    pk String,
+) Engine = MergeTree() ORDER BY pk;
+
+select name from system.tables where name = 'tab2' and database = currentDatabase();
+
+DROP TABLE IF EXISTS tab2 SYNC;
diff --git a/tests/queries/0_stateless/02864_statistics_ddl.reference b/tests/queries/0_stateless/02864_statistics_ddl.reference
index 0e453b0ee8a..a7ff5caa0b0 100644
--- a/tests/queries/0_stateless/02864_statistics_ddl.reference
+++ b/tests/queries/0_stateless/02864_statistics_ddl.reference
@@ -1,6 +1,31 @@
-CREATE TABLE default.tab\n(\n    `f64` Float64,\n    `f64_tdigest` Float64 STATISTICS(tdigest),\n    `f32` Float32,\n    `s` String,\n    `a` Array(Float64)\n)\nENGINE = MergeTree\nORDER BY tuple()\nSETTINGS index_granularity = 8192
-CREATE TABLE default.tab\n(\n    `f64` Float64 STATISTICS(tdigest, uniq),\n    `f64_tdigest` Float64 STATISTICS(tdigest),\n    `f32` Float32 STATISTICS(tdigest, uniq),\n    `s` String,\n    `a` Array(Float64)\n)\nENGINE = MergeTree\nORDER BY tuple()\nSETTINGS index_granularity = 8192
-CREATE TABLE default.tab\n(\n    `f64` Float64 STATISTICS(tdigest, uniq),\n    `f64_tdigest` Float64 STATISTICS(tdigest),\n    `f32` Float32 STATISTICS(tdigest, uniq),\n    `s` String,\n    `a` Array(Float64)\n)\nENGINE = MergeTree\nORDER BY tuple()\nSETTINGS index_granularity = 8192
-CREATE TABLE default.tab\n(\n    `f64` Float64 STATISTICS(tdigest, uniq),\n    `f64_tdigest` Float64 STATISTICS(tdigest),\n    `f32` Float32 STATISTICS(tdigest, uniq),\n    `s` String,\n    `a` Array(Float64)\n)\nENGINE = MergeTree\nORDER BY tuple()\nSETTINGS index_granularity = 8192
-CREATE TABLE default.tab\n(\n    `f64` Float64 STATISTICS(tdigest, uniq),\n    `f64_tdigest` Float64 STATISTICS(tdigest),\n    `f32` Float32 STATISTICS(tdigest, uniq),\n    `s` String,\n    `a` Array(Float64)\n)\nENGINE = MergeTree\nORDER BY tuple()\nSETTINGS index_granularity = 8192
-CREATE TABLE default.tab\n(\n    `f64` Float64,\n    `f64_tdigest` Float64 STATISTICS(tdigest),\n    `f32` Float32,\n    `s` String,\n    `a` Array(Float64)\n)\nENGINE = MergeTree\nORDER BY tuple()\nSETTINGS index_granularity = 8192
+CREATE TABLE default.tab\n(\n    `a` Float64 STATISTICS(tdigest),\n    `b` Int64 STATISTICS(tdigest),\n    `pk` String\n)\nENGINE = MergeTree\nORDER BY pk\nSETTINGS min_bytes_for_wide_part = 0, index_granularity = 8192
+After insert
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(a, 10), less(b, 10)) (removed)
+10
+0
+After drop statistic
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(b, 10), less(a, 10)) (removed)
+10
+CREATE TABLE default.tab\n(\n    `a` Float64,\n    `b` Int64,\n    `pk` String\n)\nENGINE = MergeTree\nORDER BY pk\nSETTINGS min_bytes_for_wide_part = 0, index_granularity = 8192
+After add statistic
+CREATE TABLE default.tab\n(\n    `a` Float64 STATISTICS(tdigest),\n    `b` Int64 STATISTICS(tdigest),\n    `pk` String\n)\nENGINE = MergeTree\nORDER BY pk\nSETTINGS min_bytes_for_wide_part = 0, index_granularity = 8192
+After materialize statistic
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(a, 10), less(b, 10)) (removed)
+20
+After merge
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(a, 10), less(b, 10)) (removed)
+20
+CREATE TABLE default.tab\n(\n    `a` Float64 STATISTICS(tdigest),\n    `c` Int64 STATISTICS(tdigest),\n    `pk` String\n)\nENGINE = MergeTree\nORDER BY pk\nSETTINGS min_bytes_for_wide_part = 0, index_granularity = 8192
+After rename
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(a, 10), less(c, 10)) (removed)
+20
diff --git a/tests/queries/0_stateless/02864_statistics_ddl.sql b/tests/queries/0_stateless/02864_statistics_ddl.sql
index 32b56a842b7..fe612efe2ac 100644
--- a/tests/queries/0_stateless/02864_statistics_ddl.sql
+++ b/tests/queries/0_stateless/02864_statistics_ddl.sql
@@ -1,195 +1,59 @@
--- Tags: no-fasttest
--- no-fasttest: 'count_min' sketches need a 3rd party library
-
--- Tests that DDL statements which create / drop / materialize statistics
-
-SET mutations_sync = 1;
+-- Tests that various DDL statements create/drop/materialize statistics
 
 DROP TABLE IF EXISTS tab;
 
--- Error case: Can't create statistics when allow_experimental_statistics = 0
-CREATE TABLE tab (col Float64 STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError INCORRECT_QUERY }
-
 SET allow_experimental_statistics = 1;
-
--- Error case: Unknown statistics types are rejected
-CREATE TABLE tab (col Float64 STATISTICS(no_statistics_type)) Engine = MergeTree() ORDER BY tuple(); -- { serverError INCORRECT_QUERY }
-
--- Error case: The same statistics type can't exist more than once on a column
-CREATE TABLE tab (col Float64 STATISTICS(tdigest, tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError INCORRECT_QUERY }
-
-SET allow_suspicious_low_cardinality_types = 1;
-
--- Statistics can only be created on columns of specific data types (depending on the statistics kind), (*)
-
---   tdigest requires data_type.isValueRepresentedByInteger
---     These types work:
-CREATE TABLE tab (col UInt8 STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col UInt256 STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Float32 STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Decimal32(3) STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Date STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Date32 STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col DateTime STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col DateTime64 STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Enum('hello', 'world') STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col IPv4 STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Nullable(UInt8) STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col LowCardinality(UInt8) STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col LowCardinality(Nullable(UInt8)) STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
---     These types don't work:
-CREATE TABLE tab (col String STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-CREATE TABLE tab (col FixedString(1) STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-CREATE TABLE tab (col Array(Float64) STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-CREATE TABLE tab (col Tuple(Float64, Float64) STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-CREATE TABLE tab (col Map(UInt64, UInt64) STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-CREATE TABLE tab (col UUID STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-CREATE TABLE tab (col IPv6 STATISTICS(tdigest)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-
---   uniq requires data_type.isValueRepresentedByInteger
---     These types work:
-CREATE TABLE tab (col UInt8 STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col UInt256 STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Float32 STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Decimal32(3) STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Date STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Date32 STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col DateTime STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col DateTime64 STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Enum('hello', 'world') STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col IPv4 STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Nullable(UInt8) STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col LowCardinality(UInt8) STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col LowCardinality(Nullable(UInt8)) STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
---     These types don't work:
-CREATE TABLE tab (col String STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-CREATE TABLE tab (col FixedString(1) STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-CREATE TABLE tab (col Array(Float64) STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-CREATE TABLE tab (col Tuple(Float64, Float64) STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-CREATE TABLE tab (col Map(UInt64, UInt64) STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-CREATE TABLE tab (col UUID STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-CREATE TABLE tab (col IPv6 STATISTICS(uniq)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-
---   count_min requires data_type.isValueRepresentedByInteger or data_type = (Fixed)String
---     These types work:
-CREATE TABLE tab (col UInt8 STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col UInt256 STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Float32 STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Decimal32(3) STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Date STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Date32 STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col DateTime STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col DateTime64 STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Enum('hello', 'world') STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col IPv4 STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col Nullable(UInt8) STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col LowCardinality(UInt8) STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col LowCardinality(Nullable(UInt8)) STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col String STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
-CREATE TABLE tab (col FixedString(1) STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); DROP TABLE tab;
---     These types don't work:
-CREATE TABLE tab (col Array(Float64) STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-CREATE TABLE tab (col Tuple(Float64, Float64) STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-CREATE TABLE tab (col Map(UInt64, UInt64) STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-CREATE TABLE tab (col UUID STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-CREATE TABLE tab (col IPv6 STATISTICS(count_min)) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
-
--- CREATE TABLE was easy, ALTER is more fun
+SET allow_statistics_optimize = 1;
 
 CREATE TABLE tab
 (
-    f64           Float64,
-    f64_tdigest   Float64 STATISTICS(tdigest),
-    f32           Float32,
-    s             String,
-    a             Array(Float64)
-)
-Engine = MergeTree()
-ORDER BY tuple();
+    a Float64 STATISTICS(tdigest),
+    b Int64 STATISTICS(tdigest),
+    pk String,
+) Engine = MergeTree() ORDER BY pk
+SETTINGS min_bytes_for_wide_part = 0;
 
--- Error case: Unknown statistics types are rejected
--- (relevant for ADD and MODIFY)
-ALTER TABLE tab ADD STATISTICS f64 TYPE no_statistics_type; -- { serverError INCORRECT_QUERY }
-ALTER TABLE tab ADD STATISTICS IF NOT EXISTS f64 TYPE no_statistics_type; -- { serverError INCORRECT_QUERY }
-ALTER TABLE tab MODIFY STATISTICS f64 TYPE no_statistics_type; -- { serverError INCORRECT_QUERY }
--- for some reason, ALTER TABLE tab MODIFY STATISTICS IF EXISTS is not supported
-
--- Error case: The same statistics type can't exist more than once on a column
--- (relevant for ADD and MODIFY)
---   Create the same statistics object twice
-ALTER TABLE tab ADD STATISTICS f64 TYPE tdigest, tdigest; -- { serverError INCORRECT_QUERY }
-ALTER TABLE tab ADD STATISTICS IF NOT EXISTS f64 TYPE tdigest, tdigest; -- { serverError INCORRECT_QUERY }
-ALTER TABLE tab MODIFY STATISTICS f64 TYPE tdigest, tdigest; -- { serverError INCORRECT_QUERY }
---   Create an statistics which exists already
-ALTER TABLE tab ADD STATISTICS f64_tdigest TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab ADD STATISTICS IF NOT EXISTS f64_tdigest TYPE tdigest; -- no-op
-ALTER TABLE tab MODIFY STATISTICS f64_tdigest TYPE tdigest; -- no-op
-
--- Error case: Column does not exist
--- (relevant for ADD, MODIFY, DROP, CLEAR, and MATERIALIZE)
--- Note that the results are unfortunately quite inconsistent ...
-ALTER TABLE tab ADD STATISTICS no_such_column TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab ADD STATISTICS IF NOT EXISTS no_such_column TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab MODIFY STATISTICS no_such_column TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab DROP STATISTICS no_such_column; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab DROP STATISTICS IF EXISTS no_such_column; -- no-op
-ALTER TABLE tab CLEAR STATISTICS no_such_column; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab CLEAR STATISTICS IF EXISTS no_such_column; -- no-op
-ALTER TABLE tab MATERIALIZE STATISTICS no_such_column; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab MATERIALIZE STATISTICS IF EXISTS no_such_column; -- { serverError ILLEGAL_STATISTICS }
-
--- Error case: Column exists but has no statistics
--- (relevant for MODIFY, DROP, CLEAR, and MATERIALIZE)
--- Note that the results are unfortunately quite inconsistent ...
-ALTER TABLE tab MODIFY STATISTICS s TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab DROP STATISTICS s; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab DROP STATISTICS IF EXISTS s; -- no-op
-ALTER TABLE tab CLEAR STATISTICS s; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab CLEAR STATISTICS IF EXISTS s; -- no-op
-ALTER TABLE tab MATERIALIZE STATISTICS s; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab MATERIALIZE STATISTICS IF EXISTS s; -- { serverError ILLEGAL_STATISTICS }
-
--- We don't check systematically that that statistics can only be created via ALTER ADD STATISTICS on columns of specific data types (the
--- internal type validation code is tested already above, (*)). Only do a rudimentary check for each statistics type with a data type that
--- works and one that doesn't work.
---   tdigest
---     Works:
-ALTER TABLE tab ADD STATISTICS f64 TYPE tdigest; ALTER TABLE tab DROP STATISTICS f64;
-ALTER TABLE tab MODIFY STATISTICS f64 TYPE tdigest; ALTER TABLE tab DROP STATISTICS f64;
---     Doesn't work:
-ALTER TABLE tab ADD STATISTICS a TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab MODIFY STATISTICS a TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
---   uniq
---     Works:
-ALTER TABLE tab ADD STATISTICS f64 TYPE uniq; ALTER TABLE tab DROP STATISTICS f64;
-ALTER TABLE tab MODIFY STATISTICS f64 TYPE count_min; ALTER TABLE tab DROP STATISTICS f64;
---     Doesn't work:
-ALTER TABLE tab ADD STATISTICS a TYPE uniq; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab MODIFY STATISTICS a TYPE uniq; -- { serverError ILLEGAL_STATISTICS }
---   count_min
---     Works:
-ALTER TABLE tab ADD STATISTICS f64 TYPE count_min; ALTER TABLE tab DROP STATISTICS f64;
-ALTER TABLE tab MODIFY STATISTICS f64 TYPE count_min; ALTER TABLE tab DROP STATISTICS f64;
---     Doesn't work:
-ALTER TABLE tab ADD STATISTICS a TYPE count_min; -- { serverError ILLEGAL_STATISTICS }
-ALTER TABLE tab MODIFY STATISTICS a TYPE count_min; -- { serverError ILLEGAL_STATISTICS }
-
--- Any data type changes on columns with statistics are disallowed, for simplicity even if the new data type is compatible with all existing
--- statistics objects (e.g. tdigest can be created on Float64 and UInt64)
-ALTER TABLE tab MODIFY COLUMN f64_tdigest UInt64; -- { serverError ALTER_OF_COLUMN_IS_FORBIDDEN }
-
--- Finally, do a full-circle test of a good case. Print table definition after each step.
--- Intentionally specifying _two_ columns and _two_ statistics types to have that also tested.
-SHOW CREATE TABLE tab;
-ALTER TABLE tab ADD STATISTICS f64, f32 TYPE tdigest, uniq;
-SHOW CREATE TABLE tab;
-ALTER TABLE tab MODIFY STATISTICS f64, f32 TYPE tdigest, uniq;
-SHOW CREATE TABLE tab;
-ALTER TABLE tab CLEAR STATISTICS f64, f32;
-SHOW CREATE TABLE tab;
-ALTER TABLE tab MATERIALIZE STATISTICS f64, f32;
-SHOW CREATE TABLE tab;
-ALTER TABLE tab DROP STATISTICS f64, f32;
 SHOW CREATE TABLE tab;
 
-DROP TABLE tab;
+INSERT INTO tab select number, -number, generateUUIDv4() FROM system.numbers LIMIT 10000;
+
+SELECT 'After insert';
+SELECT replaceRegexpAll(explain, '__table1\.|_UInt8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+SELECT count(*) FROM tab WHERE b < 10 and a < 10;
+SELECT count(*) FROM tab WHERE b < NULL and a < '10';
+
+ALTER TABLE tab DROP STATISTICS a, b;
+
+SELECT 'After drop statistic';
+SELECT replaceRegexpAll(explain, '__table1\.|_UInt8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+SELECT count(*) FROM tab WHERE b < 10 and a < 10;
+
+SHOW CREATE TABLE tab;
+
+ALTER TABLE tab ADD STATISTICS a, b TYPE tdigest;
+
+SELECT 'After add statistic';
+
+SHOW CREATE TABLE tab;
+
+ALTER TABLE tab MATERIALIZE STATISTICS a, b;
+INSERT INTO tab select number, -number, generateUUIDv4() FROM system.numbers LIMIT 10000;
+
+SELECT 'After materialize statistic';
+SELECT replaceRegexpAll(explain, '__table1\.|_UInt8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+SELECT count(*) FROM tab WHERE b < 10 and a < 10;
+
+OPTIMIZE TABLE tab FINAL;
+
+SELECT 'After merge';
+SELECT replaceRegexpAll(explain, '__table1\.|_UInt8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+SELECT count(*) FROM tab WHERE b < 10 and a < 10;
+
+ALTER TABLE tab RENAME COLUMN b TO c;
+SHOW CREATE TABLE tab;
+
+SELECT 'After rename';
+SELECT replaceRegexpAll(explain, '__table1\.|_UInt8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE c < 10 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+SELECT count(*) FROM tab WHERE c < 10 and a < 10;
+
+DROP TABLE IF EXISTS tab;
diff --git a/tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.reference b/tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.reference
deleted file mode 100644
index eb5e685597c..00000000000
--- a/tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.reference
+++ /dev/null
@@ -1,12 +0,0 @@
-After insert
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(b, 10_UInt8), less(a, 10_UInt8)) (removed)
-After merge
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(a, 10_UInt8), less(b, 10_UInt8)) (removed)
-After truncate, insert, and materialize
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(a, 10_UInt8), less(b, 10_UInt8)) (removed)
diff --git a/tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.sql b/tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.sql
deleted file mode 100644
index d469a4c2036..00000000000
--- a/tests/queries/0_stateless/02864_statistics_delayed_materialization_in_merge.sql
+++ /dev/null
@@ -1,36 +0,0 @@
--- Tests delayed materialization of statistics in merge instead of during insert (setting 'materialize_statistics_on_insert = 0').
--- (The concrete statistics type, column data type and predicate type don't matter)
-
--- Checks by the predicate evaluation order in EXPLAIN. This is quite fragile, a better approach would be helpful (maybe 'send_logs_level'?)
-
-DROP TABLE IF EXISTS tab;
-
-SET allow_experimental_statistics = 1;
-SET allow_statistics_optimize = 1;
-SET enable_analyzer = 1;
-
-SET materialize_statistics_on_insert = 0;
-
-CREATE TABLE tab
-(
-    a Int64 STATISTICS(tdigest),
-    b Int16 STATISTICS(tdigest),
-) ENGINE = MergeTree() ORDER BY tuple()
-SETTINGS min_bytes_for_wide_part = 0, enable_vertical_merge_algorithm = 0; -- TODO: there is a bug in vertical merge with statistics.
-
-INSERT INTO tab SELECT number, -number FROM system.numbers LIMIT 10000;
-SELECT 'After insert';
-SELECT replaceRegexpAll(explain, '__table1\.', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%'; -- checks b first, then a (statistics not used)
-
-OPTIMIZE TABLE tab FINAL;
-SELECT 'After merge';
-SELECT replaceRegexpAll(explain, '__table1\.', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%'; -- checks a first, then b (statistics used)
-
-TRUNCATE TABLE tab;
-SET mutations_sync = 2;
-INSERT INTO tab SELECT number, -number FROM system.numbers LIMIT 10000;
-ALTER TABLE tab MATERIALIZE STATISTICS a, b;
-SELECT 'After truncate, insert, and materialize';
-SELECT replaceRegexpAll(explain, '__table1\.', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%'; -- checks a first, then b (statistics used)
-
-DROP TABLE tab;
diff --git a/tests/queries/0_stateless/02864_statistics_exception.reference b/tests/queries/0_stateless/02864_statistics_exception.reference
new file mode 100644
index 00000000000..e69de29bb2d
diff --git a/tests/queries/0_stateless/02864_statistics_exception.sql b/tests/queries/0_stateless/02864_statistics_exception.sql
new file mode 100644
index 00000000000..289ffee6600
--- /dev/null
+++ b/tests/queries/0_stateless/02864_statistics_exception.sql
@@ -0,0 +1,55 @@
+-- Tests creating/dropping/materializing statistics produces the right exceptions.
+
+DROP TABLE IF EXISTS tab;
+
+-- Can't create statistics when allow_experimental_statistics = 0
+CREATE TABLE tab
+(
+    a Float64 STATISTICS(tdigest)
+) Engine = MergeTree() ORDER BY tuple(); -- { serverError INCORRECT_QUERY }
+
+SET allow_experimental_statistics = 1;
+
+-- The same type of statistics can't exist more than once on a column
+CREATE TABLE tab
+(
+    a Float64 STATISTICS(tdigest, tdigest)
+) Engine = MergeTree() ORDER BY tuple(); -- { serverError INCORRECT_QUERY }
+
+-- Unknown statistics types are rejected
+CREATE TABLE tab
+(
+    a Float64 STATISTICS(no_statistics_type)
+) Engine = MergeTree() ORDER BY tuple(); -- { serverError INCORRECT_QUERY }
+
+-- tDigest statistics can only be created on numeric columns
+CREATE TABLE tab
+(
+    a String STATISTICS(tdigest),
+) Engine = MergeTree() ORDER BY tuple(); -- { serverError ILLEGAL_STATISTICS }
+
+CREATE TABLE tab
+(
+    a Float64,
+    b String
+) Engine = MergeTree() ORDER BY tuple();
+
+ALTER TABLE tab ADD STATISTICS a TYPE no_statistics_type; -- { serverError INCORRECT_QUERY }
+ALTER TABLE tab ADD STATISTICS a TYPE tdigest;
+ALTER TABLE tab ADD STATISTICS IF NOT EXISTS a TYPE tdigest;
+ALTER TABLE tab ADD STATISTICS a TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab MODIFY STATISTICS a TYPE tdigest;
+-- tDigest statistics can be created only on numeric columns
+ALTER TABLE tab ADD STATISTICS b TYPE tdigest; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab DROP STATISTICS b; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab DROP STATISTICS a;
+ALTER TABLE tab DROP STATISTICS IF EXISTS a;
+ALTER TABLE tab CLEAR STATISTICS a; -- { serverError ILLEGAL_STATISTICS }
+ALTER TABLE tab CLEAR STATISTICS IF EXISTS a;
+ALTER TABLE tab MATERIALIZE STATISTICS b; -- { serverError ILLEGAL_STATISTICS }
+
+ALTER TABLE tab ADD STATISTICS a TYPE tdigest;
+ALTER TABLE tab MODIFY COLUMN a Float64 TTL toDateTime(b) + INTERVAL 1 MONTH;
+ALTER TABLE tab MODIFY COLUMN a Int64; -- { serverError ALTER_OF_COLUMN_IS_FORBIDDEN }
+
+DROP TABLE tab;
diff --git a/tests/queries/0_stateless/02864_statistics_materialize_in_merge.reference b/tests/queries/0_stateless/02864_statistics_materialize_in_merge.reference
new file mode 100644
index 00000000000..5e969cf41cb
--- /dev/null
+++ b/tests/queries/0_stateless/02864_statistics_materialize_in_merge.reference
@@ -0,0 +1,10 @@
+10
+10
+10
+statistics not used	Condition less(b, 10_UInt8) moved to PREWHERE
+statistics not used	Condition less(a, 10_UInt8) moved to PREWHERE
+statistics used after merge	Condition less(a, 10_UInt8) moved to PREWHERE
+statistics used after merge	Condition less(b, 10_UInt8) moved to PREWHERE
+statistics used after materialize	Condition less(a, 10_UInt8) moved to PREWHERE
+statistics used after materialize	Condition less(b, 10_UInt8) moved to PREWHERE
+2	0
diff --git a/tests/queries/0_stateless/02864_statistics_materialize_in_merge.sql b/tests/queries/0_stateless/02864_statistics_materialize_in_merge.sql
new file mode 100644
index 00000000000..6606cff263f
--- /dev/null
+++ b/tests/queries/0_stateless/02864_statistics_materialize_in_merge.sql
@@ -0,0 +1,52 @@
+-- Tests delayed materialization of statistics in merge instead of during insert (setting 'materialize_statistics_on_insert = 0').
+
+DROP TABLE IF EXISTS tab;
+
+SET enable_analyzer = 1;
+SET allow_experimental_statistics = 1;
+SET allow_statistics_optimize = 1;
+
+SET materialize_statistics_on_insert = 0;
+
+CREATE TABLE tab
+(
+    a Int64 STATISTICS(tdigest),
+    b Int16 STATISTICS(tdigest),
+) ENGINE = MergeTree() ORDER BY tuple()
+SETTINGS min_bytes_for_wide_part = 0, enable_vertical_merge_algorithm = 0; -- TODO: there is a bug in vertical merge with statistics.
+
+INSERT INTO tab SELECT number, -number FROM system.numbers LIMIT 10000;
+
+SELECT count(*) FROM tab WHERE b < 10 and a < 10 SETTINGS log_comment = 'statistics not used';
+
+OPTIMIZE TABLE tab FINAL;
+
+SELECT count(*) FROM tab WHERE b < 10 and a < 10 SETTINGS log_comment = 'statistics used after merge';
+
+TRUNCATE TABLE tab;
+SET mutations_sync = 2;
+
+INSERT INTO tab SELECT number, -number FROM system.numbers LIMIT 10000;
+ALTER TABLE tab MATERIALIZE STATISTICS a, b;
+
+SELECT count(*) FROM tab WHERE b < 10 and a < 10 SETTINGS log_comment = 'statistics used after materialize';
+
+DROP TABLE tab;
+
+SYSTEM FLUSH LOGS;
+
+SELECT log_comment, message FROM system.text_log JOIN
+(
+    SELECT Settings['log_comment'] AS log_comment, query_id FROM system.query_log
+    WHERE current_database = currentDatabase()
+        AND query LIKE 'SELECT count(*) FROM tab%'
+        AND type = 'QueryFinish'
+) AS query_log USING (query_id)
+WHERE message LIKE '%moved to PREWHERE%'
+ORDER BY event_time_microseconds;
+
+SELECT count(), sum(ProfileEvents['MergeTreeDataWriterStatisticsCalculationMicroseconds'])
+FROM system.query_log
+WHERE current_database = currentDatabase()
+    AND query LIKE 'INSERT INTO tab SELECT%'
+    AND type = 'QueryFinish';
diff --git a/tests/queries/0_stateless/02864_statistics_predicates.reference b/tests/queries/0_stateless/02864_statistics_predicates.reference
deleted file mode 100644
index ffbd7269e05..00000000000
--- a/tests/queries/0_stateless/02864_statistics_predicates.reference
+++ /dev/null
@@ -1,98 +0,0 @@
-u64 and =
-10
-10
-10
-10
-0
-0
-0
-0
-10
-10
-10
-10
-u64 and <
-70
-70
-70
-70
-80
-80
-80
-80
-70
-70
-70
-70
-f64 and =
-10
-10
-10
-10
-0
-0
-0
-0
-10
-10
-10
-10
-0
-0
-0
-0
-f64 and <
-70
-70
-70
-70
-80
-80
-80
-80
-70
-70
-70
-70
-80
-80
-80
-80
-dt and =
-0
-0
-0
-0
-10
-10
-10
-10
-dt and <
-10000
-10000
-10000
-10000
-70
-70
-70
-70
-b and =
-5000
-5000
-5000
-5000
-5000
-5000
-5000
-5000
-5000
-5000
-5000
-5000
-0
-0
-0
-0
-s and =
-10
-10
diff --git a/tests/queries/0_stateless/02864_statistics_predicates.sql b/tests/queries/0_stateless/02864_statistics_predicates.sql
deleted file mode 100644
index 779116cf19a..00000000000
--- a/tests/queries/0_stateless/02864_statistics_predicates.sql
+++ /dev/null
@@ -1,214 +0,0 @@
--- Tags: no-fasttest
--- no-fasttest: 'count_min' sketches need a 3rd party library
-
--- Tests the cross product of all predicates with all right-hand sides on all data types and all statistics types.
-
-SET allow_experimental_statistics = 1;
-SET allow_statistics_optimize = 1;
-
-DROP TABLE IF EXISTS tab;
-
-CREATE TABLE tab
-(
-    u64                 UInt64,
-    u64_tdigest         UInt64 STATISTICS(tdigest),
-    u64_count_min       UInt64 STATISTICS(count_min),
-    u64_uniq            UInt64 STATISTICS(uniq),
-    f64                 Float64,
-    f64_tdigest         Float64 STATISTICS(tdigest),
-    f64_count_min       Float64 STATISTICS(count_min),
-    f64_uniq            Float64 STATISTICS(uniq),
-    dt                  DateTime,
-    dt_tdigest          DateTime STATISTICS(tdigest),
-    dt_count_min        DateTime STATISTICS(count_min),
-    dt_uniq             DateTime STATISTICS(uniq),
-    b                   Bool,
-    b_tdigest           Bool STATISTICS(tdigest),
-    b_count_min         Bool STATISTICS(count_min),
-    b_uniq              Bool STATISTICS(uniq),
-    s                   String,
- -- s_tdigest           String STATISTICS(tdigest), -- not supported by tdigest
-    s_count_min         String STATISTICS(count_min)
- -- s_uniq              String STATISTICS(uniq), -- not supported by uniq
-) Engine = MergeTree() ORDER BY tuple()
-SETTINGS min_bytes_for_wide_part = 0;
-
-INSERT INTO tab
--- SELECT number % 10000, number % 1000, -(number % 100) FROM system.numbers LIMIT 10000;
-SELECT number % 1000,
-       number % 1000,
-       number % 1000,
-       number % 1000,
-       number % 1000,
-       number % 1000,
-       number % 1000,
-       number % 1000,
-       number % 1000,
-       number % 1000,
-       number % 1000,
-       number % 1000,
-       number % 2,
-       number % 2,
-       number % 2,
-       number % 2,
-       toString(number % 1000),
-       toString(number % 1000)
-FROM system.numbers LIMIT 10000;
-
--- u64 ----------------------------------------------------
-
-SELECT 'u64 and =';
-
-SELECT count(*) FROM tab WHERE u64 = 7;
-SELECT count(*) FROM tab WHERE u64_tdigest = 7;
-SELECT count(*) FROM tab WHERE u64_count_min = 7;
-SELECT count(*) FROM tab WHERE u64_uniq = 7;
-
-SELECT count(*) FROM tab WHERE u64 = 7.7;
-SELECT count(*) FROM tab WHERE u64_tdigest = 7.7;
-SELECT count(*) FROM tab WHERE u64_count_min = 7.7;
-SELECT count(*) FROM tab WHERE u64_uniq = 7.7;
-
-SELECT count(*) FROM tab WHERE u64 = '7';
-SELECT count(*) FROM tab WHERE u64_tdigest = '7';
-SELECT count(*) FROM tab WHERE u64_count_min = '7';
-SELECT count(*) FROM tab WHERE u64_uniq = '7';
-
-SELECT count(*) FROM tab WHERE u64 = '7.7'; -- { serverError TYPE_MISMATCH }
-SELECT count(*) FROM tab WHERE u64_tdigest = '7.7'; -- { serverError TYPE_MISMATCH }
-SELECT count(*) FROM tab WHERE u64_count_min = '7.7'; -- { serverError TYPE_MISMATCH }
-SELECT count(*) FROM tab WHERE u64_uniq = '7.7'; -- { serverError TYPE_MISMATCH }
-
-SELECT 'u64 and <';
-
-SELECT count(*) FROM tab WHERE u64 < 7;
-SELECT count(*) FROM tab WHERE u64_tdigest < 7;
-SELECT count(*) FROM tab WHERE u64_count_min < 7;
-SELECT count(*) FROM tab WHERE u64_uniq < 7;
-
-SELECT count(*) FROM tab WHERE u64 < 7.7;
-SELECT count(*) FROM tab WHERE u64_tdigest < 7.7;
-SELECT count(*) FROM tab WHERE u64_count_min < 7.7;
-SELECT count(*) FROM tab WHERE u64_uniq < 7.7;
-
-SELECT count(*) FROM tab WHERE u64 < '7';
-SELECT count(*) FROM tab WHERE u64_tdigest < '7';
-SELECT count(*) FROM tab WHERE u64_count_min < '7';
-SELECT count(*) FROM tab WHERE u64_uniq < '7';
-
-SELECT count(*) FROM tab WHERE u64 < '7.7'; -- { serverError TYPE_MISMATCH }
-SELECT count(*) FROM tab WHERE u64_tdigest < '7.7'; -- { serverError TYPE_MISMATCH }
-SELECT count(*) FROM tab WHERE u64_count_min < '7.7'; -- { serverError TYPE_MISMATCH }
-SELECT count(*) FROM tab WHERE u64_uniq < '7.7'; -- { serverError TYPE_MISMATCH }
-
--- f64 ----------------------------------------------------
-
-SELECT 'f64 and =';
-
-SELECT count(*) FROM tab WHERE f64 = 7;
-SELECT count(*) FROM tab WHERE f64_tdigest = 7;
-SELECT count(*) FROM tab WHERE f64_count_min = 7;
-SELECT count(*) FROM tab WHERE f64_uniq = 7;
-
-SELECT count(*) FROM tab WHERE f64 = 7.7;
-SELECT count(*) FROM tab WHERE f64_tdigest = 7.7;
-SELECT count(*) FROM tab WHERE f64_count_min = 7.7;
-SELECT count(*) FROM tab WHERE f64_uniq = 7.7;
-
-SELECT count(*) FROM tab WHERE f64 = '7';
-SELECT count(*) FROM tab WHERE f64_tdigest = '7';
-SELECT count(*) FROM tab WHERE f64_count_min = '7';
-SELECT count(*) FROM tab WHERE f64_uniq = '7';
-
-SELECT count(*) FROM tab WHERE f64 = '7.7';
-SELECT count(*) FROM tab WHERE f64_tdigest = '7.7';
-SELECT count(*) FROM tab WHERE f64_count_min = '7.7';
-SELECT count(*) FROM tab WHERE f64_uniq = '7.7';
-
-SELECT 'f64 and <';
-
-SELECT count(*) FROM tab WHERE f64 < 7;
-SELECT count(*) FROM tab WHERE f64_tdigest < 7;
-SELECT count(*) FROM tab WHERE f64_count_min < 7;
-SELECT count(*) FROM tab WHERE f64_uniq < 7;
-
-SELECT count(*) FROM tab WHERE f64 < 7.7;
-SELECT count(*) FROM tab WHERE f64_tdigest < 7.7;
-SELECT count(*) FROM tab WHERE f64_count_min < 7.7;
-SELECT count(*) FROM tab WHERE f64_uniq < 7.7;
-
-SELECT count(*) FROM tab WHERE f64 < '7';
-SELECT count(*) FROM tab WHERE f64_tdigest < '7';
-SELECT count(*) FROM tab WHERE f64_count_min < '7';
-SELECT count(*) FROM tab WHERE f64_uniq < '7';
-
-SELECT count(*) FROM tab WHERE f64 < '7.7';
-SELECT count(*) FROM tab WHERE f64_tdigest < '7.7';
-SELECT count(*) FROM tab WHERE f64_count_min < '7.7';
-SELECT count(*) FROM tab WHERE f64_uniq < '7.7';
-
--- dt ----------------------------------------------------
-
-SELECT 'dt and =';
-
-SELECT count(*) FROM tab WHERE dt = '2024-08-08 11:12:13';
-SELECT count(*) FROM tab WHERE dt_tdigest = '2024-08-08 11:12:13';
-SELECT count(*) FROM tab WHERE dt_count_min = '2024-08-08 11:12:13';
-SELECT count(*) FROM tab WHERE dt_uniq = '2024-08-08 11:12:13';
-
-SELECT count(*) FROM tab WHERE dt = 7;
-SELECT count(*) FROM tab WHERE dt_tdigest = 7;
-SELECT count(*) FROM tab WHERE dt_count_min = 7;
-SELECT count(*) FROM tab WHERE dt_uniq = 7;
-
-SELECT 'dt and <';
-
-SELECT count(*) FROM tab WHERE dt < '2024-08-08 11:12:13';
-SELECT count(*) FROM tab WHERE dt_tdigest < '2024-08-08 11:12:13';
-SELECT count(*) FROM tab WHERE dt_count_min < '2024-08-08 11:12:13';
-SELECT count(*) FROM tab WHERE dt_uniq < '2024-08-08 11:12:13';
-
-SELECT count(*) FROM tab WHERE dt < 7;
-SELECT count(*) FROM tab WHERE dt_tdigest < 7;
-SELECT count(*) FROM tab WHERE dt_count_min < 7;
-SELECT count(*) FROM tab WHERE dt_uniq < 7;
-
--- b ----------------------------------------------------
-
-SELECT 'b and =';
-
-SELECT count(*) FROM tab WHERE b = true;
-SELECT count(*) FROM tab WHERE b_tdigest = true;
-SELECT count(*) FROM tab WHERE b_count_min = true;
-SELECT count(*) FROM tab WHERE b_uniq = true;
-
-SELECT count(*) FROM tab WHERE b = 'true';
-SELECT count(*) FROM tab WHERE b_tdigest = 'true';
-SELECT count(*) FROM tab WHERE b_count_min = 'true';
-SELECT count(*) FROM tab WHERE b_uniq = 'true';
-
-SELECT count(*) FROM tab WHERE b = 1;
-SELECT count(*) FROM tab WHERE b_tdigest = 1;
-SELECT count(*) FROM tab WHERE b_count_min = 1;
-SELECT count(*) FROM tab WHERE b_uniq = 1;
-
-SELECT count(*) FROM tab WHERE b = 1.1;
-SELECT count(*) FROM tab WHERE b_tdigest = 1.1;
-SELECT count(*) FROM tab WHERE b_count_min = 1.1;
-SELECT count(*) FROM tab WHERE b_uniq = 1.1;
-
--- s ----------------------------------------------------
-
-SELECT 's and =';
-
-SELECT count(*) FROM tab WHERE s = 7; -- { serverError NO_COMMON_TYPE }
--- SELECT count(*) FROM tab WHERE s_tdigest = 7; -- not supported
-SELECT count(*) FROM tab WHERE s_count_min = 7; -- { serverError NO_COMMON_TYPE }
--- SELECT count(*) FROM tab WHERE s_uniq = 7; -- not supported
-
-SELECT count(*) FROM tab WHERE s = '7';
--- SELECT count(*) FROM tab WHERE s_tdigest = '7'; -- not supported
-SELECT count(*) FROM tab WHERE s_count_min = '7';
--- SELECT count(*) FROM tab WHERE s_uniq = '7'; -- not supported
-
-DROP TABLE tab;
diff --git a/tests/queries/0_stateless/02864_statistics_uniq.reference b/tests/queries/0_stateless/02864_statistics_uniq.reference
new file mode 100644
index 00000000000..77786dbdd8c
--- /dev/null
+++ b/tests/queries/0_stateless/02864_statistics_uniq.reference
@@ -0,0 +1,35 @@
+CREATE TABLE default.t1\n(\n    `a` Float64 STATISTICS(tdigest),\n    `b` Int64 STATISTICS(tdigest),\n    `c` Int64 STATISTICS(tdigest, uniq),\n    `pk` String\n)\nENGINE = MergeTree\nORDER BY pk\nSETTINGS min_bytes_for_wide_part = 0, index_granularity = 8192
+After insert
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(a, 10), equals(c, 0), less(b, 10)) (removed)
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(equals(c, 11), less(a, 10), less(b, 10)) (removed)
+After merge
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(a, 10), equals(c, 0), less(b, 10)) (removed)
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(equals(c, 11), less(a, 10), less(b, 10)) (removed)
+After modify TDigest
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(a, 10), equals(c, 11), less(b, 10)) (removed)
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(a, 10), equals(c, 0), less(b, 10)) (removed)
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(c, -1), less(a, 10), less(b, 10)) (removed)
+After drop
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(a, 10), equals(c, 11), less(b, 10)) (removed)
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(a, 10), equals(c, 0), less(b, 10)) (removed)
+        Prewhere info
+          Prewhere filter
+          Prewhere filter column: and(less(a, 10), less(c, -1), less(b, 10)) (removed)
diff --git a/tests/queries/0_stateless/02864_statistics_uniq.sql b/tests/queries/0_stateless/02864_statistics_uniq.sql
new file mode 100644
index 00000000000..0f5f353c045
--- /dev/null
+++ b/tests/queries/0_stateless/02864_statistics_uniq.sql
@@ -0,0 +1,73 @@
+DROP TABLE IF EXISTS t1;
+
+SET allow_experimental_statistics = 1;
+SET allow_statistics_optimize = 1;
+SET mutations_sync = 1;
+
+CREATE TABLE t1
+(
+    a Float64 STATISTICS(tdigest),
+    b Int64 STATISTICS(tdigest),
+    c Int64 STATISTICS(tdigest, uniq),
+    pk String,
+) Engine = MergeTree() ORDER BY pk
+SETTINGS min_bytes_for_wide_part = 0;
+
+SHOW CREATE TABLE t1;
+
+INSERT INTO t1 select number, -number, number/1000, generateUUIDv4() FROM system.numbers LIMIT 10000;
+INSERT INTO t1 select 0, 0, 11, generateUUIDv4();
+
+SELECT 'After insert';
+SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c = 0 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c = 11 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+OPTIMIZE TABLE t1 FINAL;
+
+SELECT 'After merge';
+SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c = 0 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c = 11 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+
+SELECT 'After modify TDigest';
+ALTER TABLE t1 MODIFY STATISTICS c TYPE TDigest;
+ALTER TABLE t1 MATERIALIZE STATISTICS c;
+
+SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c = 11 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c = 0 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c < -1 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+
+
+ALTER TABLE t1 DROP STATISTICS c;
+
+SELECT 'After drop';
+SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c = 11 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c = 0 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+SELECT replaceRegexpAll(explain, '__table1.|_UInt8|_Int8', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM t1 WHERE b < 10 and c < -1 and a < 10) WHERE explain LIKE '%Prewhere%' OR explain LIKE '%Filter column%';
+
+DROP TABLE IF EXISTS t1;
+DROP TABLE IF EXISTS t2;
+SET allow_suspicious_low_cardinality_types=1;
+CREATE TABLE t2
+(
+    a Float64 STATISTICS(tdigest),
+    b Int64 STATISTICS(tdigest),
+    c LowCardinality(Int64) STATISTICS(tdigest, uniq),
+    pk String,
+) Engine = MergeTree() ORDER BY pk
+SETTINGS min_bytes_for_wide_part = 0;
+INSERT INTO t2 select number, -number, number/1000, generateUUIDv4() FROM system.numbers LIMIT 10000;
+
+DROP TABLE IF EXISTS t2;
+DROP TABLE IF EXISTS t3;
+
+CREATE TABLE t3
+(
+    a Float64 STATISTICS(tdigest),
+    b Int64 STATISTICS(tdigest),
+    c Nullable(Int64) STATISTICS(tdigest, uniq),
+    pk String,
+) Engine = MergeTree() ORDER BY pk
+SETTINGS min_bytes_for_wide_part = 0;
+INSERT INTO t3 select number, -number, number/1000, generateUUIDv4() FROM system.numbers LIMIT 10000;
+
+DROP TABLE IF EXISTS t3;
+
diff --git a/tests/queries/0_stateless/02864_statistics_usage.reference b/tests/queries/0_stateless/02864_statistics_usage.reference
deleted file mode 100644
index a9f669b88c1..00000000000
--- a/tests/queries/0_stateless/02864_statistics_usage.reference
+++ /dev/null
@@ -1,20 +0,0 @@
-After insert
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(a, 10_UInt8), less(b, 10_UInt8)) (removed)
-After drop statistic
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(b, 10_UInt8), less(a, 10_UInt8)) (removed)
-After add and materialize statistic
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(a, 10_UInt8), less(b, 10_UInt8)) (removed)
-After merge
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(a, 10_UInt8), less(b, 10_UInt8)) (removed)
-After rename
-        Prewhere info
-          Prewhere filter
-          Prewhere filter column: and(less(a, 10_UInt8), less(c, 10_UInt8)) (removed)
diff --git a/tests/queries/0_stateless/02864_statistics_usage.sql b/tests/queries/0_stateless/02864_statistics_usage.sql
deleted file mode 100644
index 4956bd27e87..00000000000
--- a/tests/queries/0_stateless/02864_statistics_usage.sql
+++ /dev/null
@@ -1,42 +0,0 @@
--- Test that the optimizer picks up column statistics
--- (The concrete statistics type, column data type and predicate type don't matter)
-
--- Checks by the predicate evaluation order in EXPLAIN. This is quite fragile, a better approach would be helpful (maybe 'send_logs_level'?)
-
-SET allow_experimental_statistics = 1;
-SET allow_statistics_optimize = 1;
-SET mutations_sync = 1;
-SET enable_analyzer = 1;
-
-DROP TABLE IF EXISTS tab;
-
-CREATE TABLE tab
-(
-    a Float64 STATISTICS(tdigest),
-    b Int64 STATISTICS(tdigest)
-) Engine = MergeTree() ORDER BY tuple()
-SETTINGS min_bytes_for_wide_part = 0;
-
-INSERT INTO tab select number, -number FROM system.numbers LIMIT 10000;
-SELECT 'After insert';
-SELECT replaceRegexpAll(explain, '__table1\.', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%'; -- checks a first, then b (statistics used)
-
-ALTER TABLE tab DROP STATISTICS a, b;
-SELECT 'After drop statistic';
-SELECT replaceRegexpAll(explain, '__table1\.', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%'; -- checks b first, then a (statistics not used)
-
-ALTER TABLE tab ADD STATISTICS a, b TYPE tdigest;
-ALTER TABLE tab MATERIALIZE STATISTICS a, b;
-INSERT INTO tab select number, -number FROM system.numbers LIMIT 10000;
-SELECT 'After add and materialize statistic';
-SELECT replaceRegexpAll(explain, '__table1\.', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%'; -- checks a first, then b (statistics used)
-
-OPTIMIZE TABLE tab FINAL;
-SELECT 'After merge';
-SELECT replaceRegexpAll(explain, '__table1\.', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE b < 10 and a < 10) WHERE explain LIKE '%Prewhere%'; -- checks a first, then b (statistics used)
-
-ALTER TABLE tab RENAME COLUMN b TO c;
-SELECT 'After rename';
-SELECT replaceRegexpAll(explain, '__table1\.', '') FROM (EXPLAIN actions=1 SELECT count(*) FROM tab WHERE c < 10 and a < 10) WHERE explain LIKE '%Prewhere%'; -- checks a first, then c (statistics used)
-
-DROP TABLE IF EXISTS tab;

From 29afd2de785450f2e7f5faec1dc6b35e166cefb4 Mon Sep 17 00:00:00 2001
From: Azat Khuzhin <a3at.mail@gmail.com>
Date: Sun, 11 Aug 2024 13:26:45 +0200
Subject: [PATCH 50/52] Remove "Processing configuration file" message from
 clickhouse-local

Make the behaviour identical to the clickhouse-client

Signed-off-by: Azat Khuzhin <a.khuzhin@semrush.com>
---
 programs/local/LocalServer.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/programs/local/LocalServer.cpp b/programs/local/LocalServer.cpp
index 6b0b8fc5b50..200beea7b63 100644
--- a/programs/local/LocalServer.cpp
+++ b/programs/local/LocalServer.cpp
@@ -143,7 +143,7 @@ void LocalServer::initialize(Poco::Util::Application & self)
 
     if (fs::exists(config_path))
     {
-        ConfigProcessor config_processor(config_path, false, true);
+        ConfigProcessor config_processor(config_path);
         ConfigProcessor::setConfigPath(fs::path(config_path).parent_path());
         auto loaded_config = config_processor.loadConfig();
         getClientConfiguration().add(loaded_config.configuration.duplicate(), PRIO_DEFAULT, false);

From d314e5aa45fb8ac91324721ab278185b09437a40 Mon Sep 17 00:00:00 2001
From: Vladimir Varankin <vladimir@varank.in>
Date: Sun, 11 Aug 2024 18:37:29 +0200
Subject: [PATCH 51/52] typos in prometheus.md

---
 docs/en/interfaces/prometheus.md | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/docs/en/interfaces/prometheus.md b/docs/en/interfaces/prometheus.md
index bf541901b34..8e7023cc51f 100644
--- a/docs/en/interfaces/prometheus.md
+++ b/docs/en/interfaces/prometheus.md
@@ -75,7 +75,7 @@ Data are received by this protocol and written to a [TimeSeries](/en/engines/tab
         <my_rule_1>
             <url>/write</url>
             <handler>
-                <type>remote_write</type
+                <type>remote_write</type>
                 <database>db_name</database>
                 <table>time_series_table</table>
             </handler>
@@ -105,7 +105,7 @@ Data are read from a [TimeSeries](/en/engines/table-engines/special/time_series)
         <my_rule_1>
             <url>/read</url>
             <handler>
-                <type>remote_read</type
+                <type>remote_read</type>
                 <database>db_name</database>
                 <table>time_series_table</table>
             </handler>
@@ -144,14 +144,14 @@ Multiple protocols can be specified together in one place:
         <my_rule_2>
             <url>/write</url>
             <handler>
-                <type>remote_write</type
+                <type>remote_write</type>
                 <table>db_name.time_series_table</table>
             </handler>
         </my_rule_2>
         <my_rule_3>
             <url>/read</url>
             <handler>
-                <type>remote_read</type
+                <type>remote_read</type>
                 <table>db_name.time_series_table</table>
             </handler>
         </my_rule_3>

From e384e2c38e405b1b4758adaa44cd321e6d7f41b3 Mon Sep 17 00:00:00 2001
From: Azat Khuzhin <a3at.mail@gmail.com>
Date: Sun, 11 Aug 2024 18:34:33 +0200
Subject: [PATCH 52/52] tests: fix 02122_join_group_by_timeout flakiness

CI found [1] failure of the test:

    2024-08-11 21:06:07 /usr/share/clickhouse-test/queries/0_stateless/02122_join_group_by_timeout.sh: line 51: 52614 Killed                  timeout -s KILL $MAX_PROCESS_WAIT $CLICKHOUSE_CLIENT -q "SELECT a.name as n

And the problem is not the server, but the client, since the query itself
executed for only ~1 second:

    2024.08.11 21:06:02.284318 [ 49232 ] {ba989ee2-f615-49ca-bcd8-31b3916aeb2c} <Debug> executeQuery: (from [::1]:54144) (comment: 02122_join_group_by_timeout.sh) SELECT a.name as n FROM ( SELECT 'Name' as name, number FROM system.numbers LIMIT 2000000 ) AS a, ( SELECT 'Name' as name2, number FROM system.numbers LIMIT 2000000 ) as b FORMAT Null SETTINGS max_execution_time = 1, timeout_overflow_mode = 'break'  (stage: Complete)
    2024.08.11 21:06:03.331249 [ 49232 ] {ba989ee2-f615-49ca-bcd8-31b3916aeb2c} <Debug> executeQuery: Read 517104 rows, 3.95 MiB in 1.072023 sec., 482362.78512681165 rows/sec., 3.68 MiB/sec.

  [1]: https://s3.amazonaws.com/clickhouse-test-reports/67134/18da3f0ab63da1eef9396627d0dfd56cf5356f65/stateless_tests__msan__[1_4].html

So instead of relying on timeout, let's check the query duration from
system.query_log.

Signed-off-by: Azat Khuzhin <a.khuzhin@semrush.com>
---
 .../02122_join_group_by_timeout.reference     |  6 +-
 .../02122_join_group_by_timeout.sh            | 70 ++++++++++---------
 2 files changed, 41 insertions(+), 35 deletions(-)

diff --git a/tests/queries/0_stateless/02122_join_group_by_timeout.reference b/tests/queries/0_stateless/02122_join_group_by_timeout.reference
index f314e22e519..6500560e8fc 100644
--- a/tests/queries/0_stateless/02122_join_group_by_timeout.reference
+++ b/tests/queries/0_stateless/02122_join_group_by_timeout.reference
@@ -1,4 +1,6 @@
-Code: 159
-0
+Code: 159
+query_duration	1
+0
+query_duration	1
 Code: 159
 0
diff --git a/tests/queries/0_stateless/02122_join_group_by_timeout.sh b/tests/queries/0_stateless/02122_join_group_by_timeout.sh
index 8380c5dbd0c..b4644878544 100755
--- a/tests/queries/0_stateless/02122_join_group_by_timeout.sh
+++ b/tests/queries/0_stateless/02122_join_group_by_timeout.sh
@@ -1,27 +1,23 @@
 #!/usr/bin/env bash
-# Tags: no-debug
-
-# no-debug: Query is canceled by timeout after max_execution_time,
-#           but sending an exception to the client may hang
-#           for more than MAX_PROCESS_WAIT seconds in a slow debug build,
-#           and test will fail.
 
 CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)
 # shellcheck source=../shell_config.sh
 . "$CURDIR"/../shell_config.sh
 
-MAX_PROCESS_WAIT=5
-
-IS_SANITIZER=$($CLICKHOUSE_CLIENT -q "SELECT count() FROM system.warnings WHERE message like '%built with sanitizer%'")
-if [ "$IS_SANITIZER" -gt 0 ]; then
-    # Query may hang for more than 5 seconds, especially in tsan build
-    MAX_PROCESS_WAIT=15
+TIMEOUT=5
+IS_SANITIZER_OR_DEBUG=$($CLICKHOUSE_CLIENT -q "SELECT count() FROM system.warnings WHERE message like '%built with sanitizer%' or message like '%built in debug mode%'")
+if [ "$IS_SANITIZER_OR_DEBUG" -gt 0 ]; then
+    # Increase the timeout, since in debug/sanitizer builds:
+    # - client is slow
+    # - stacktrace resolving is slow
+    TIMEOUT=15
 fi
 
 # TCP CLIENT: As of today (02/12/21) uses PullingAsyncPipelineExecutor
 ### Should be cancelled after 1 second and return a 159 exception (timeout)
-timeout -s KILL $MAX_PROCESS_WAIT $CLICKHOUSE_CLIENT --max_execution_time 1 -q \
-    "SELECT * FROM
+query_id=$(random_str 12)
+$CLICKHOUSE_CLIENT --query_id "$query_id" --max_execution_time 1 -q "
+    SELECT * FROM
     (
         SELECT a.name as n
         FROM
@@ -34,28 +30,35 @@ timeout -s KILL $MAX_PROCESS_WAIT $CLICKHOUSE_CLIENT --max_execution_time 1 -q \
         GROUP BY n
     )
     LIMIT 20
-    FORMAT Null" 2>&1 | grep -o "Code: 159" | sort | uniq
+    FORMAT Null
+" 2>&1 | grep -m1 -o "Code: 159"
+$CLICKHOUSE_CLIENT -q "system flush logs"
+${CLICKHOUSE_CURL} -q -sS "$CLICKHOUSE_URL" -d "select 'query_duration', round(query_duration_ms/1000) from system.query_log where current_database = '$CLICKHOUSE_DATABASE' and query_id = '$query_id' and type != 'QueryStart'"
+
 
 ### Should stop pulling data and return what has been generated already (return code 0)
-timeout -s KILL $MAX_PROCESS_WAIT $CLICKHOUSE_CLIENT -q \
-    "SELECT a.name as n
-     FROM
-     (
-         SELECT 'Name' as name, number FROM system.numbers LIMIT 2000000
-     ) AS a,
-     (
-         SELECT 'Name' as name2, number FROM system.numbers LIMIT 2000000
-     ) as b
-     FORMAT Null
-     SETTINGS max_execution_time = 1, timeout_overflow_mode = 'break'
-    "
+query_id=$(random_str 12)
+$CLICKHOUSE_CLIENT --query_id "$query_id" -q "
+    SELECT a.name as n
+    FROM
+    (
+        SELECT 'Name' as name, number FROM system.numbers LIMIT 2000000
+    ) AS a,
+    (
+        SELECT 'Name' as name2, number FROM system.numbers LIMIT 2000000
+    ) as b
+    FORMAT Null
+    SETTINGS max_execution_time = 1, timeout_overflow_mode = 'break'
+"
 echo $?
+$CLICKHOUSE_CLIENT -q "system flush logs"
+${CLICKHOUSE_CURL} -q -sS "$CLICKHOUSE_URL" -d "select 'query_duration', round(query_duration_ms/1000) from system.query_log where current_database = '$CLICKHOUSE_DATABASE' and query_id = '$query_id' and type != 'QueryStart'"
 
 
 # HTTP CLIENT: As of today (02/12/21) uses PullingPipelineExecutor
 ### Should be cancelled after 1 second and return a 159 exception (timeout)
-${CLICKHOUSE_CURL} -q --max-time $MAX_PROCESS_WAIT -sS "$CLICKHOUSE_URL&max_execution_time=1" -d \
-    "SELECT * FROM
+${CLICKHOUSE_CURL} -q --max-time $TIMEOUT -sS "$CLICKHOUSE_URL&max_execution_time=1" -d "
+    SELECT * FROM
     (
         SELECT a.name as n
         FROM
@@ -68,12 +71,13 @@ ${CLICKHOUSE_CURL} -q --max-time $MAX_PROCESS_WAIT -sS "$CLICKHOUSE_URL&max_exec
         GROUP BY n
     )
     LIMIT 20
-    FORMAT Null" 2>&1 | grep -o "Code: 159" | sort | uniq
+    FORMAT Null
+" 2>&1 | grep -o "Code: 159" | sort | uniq
 
 
 ### Should stop pulling data and return what has been generated already (return code 0)
-${CLICKHOUSE_CURL} -q --max-time $MAX_PROCESS_WAIT -sS "$CLICKHOUSE_URL" -d \
-    "SELECT a.name as n
+${CLICKHOUSE_CURL} -q --max-time $TIMEOUT -sS "$CLICKHOUSE_URL" -d "
+    SELECT a.name as n
           FROM
           (
               SELECT 'Name' as name, number FROM system.numbers LIMIT 2000000
@@ -83,5 +87,5 @@ ${CLICKHOUSE_CURL} -q --max-time $MAX_PROCESS_WAIT -sS "$CLICKHOUSE_URL" -d \
           ) as b
           FORMAT Null
           SETTINGS max_execution_time = 1, timeout_overflow_mode = 'break'
-    "
+"
 echo $?