From 26c9042ea0f0529f464435cbeef111f3e6d396a5 Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Mon, 12 Jun 2023 17:06:52 +0000 Subject: [PATCH 0001/1081] Analyzer: support aliases in StorageMerge --- src/Analyzer/IQueryTreePass.h | 2 +- ...egateFunctionsArithmericOperationsPass.cpp | 2 +- ...gregateFunctionsArithmericOperationsPass.h | 2 +- src/Analyzer/Passes/ArrayExistsToHasPass.cpp | 2 +- src/Analyzer/Passes/ArrayExistsToHasPass.h | 2 +- src/Analyzer/Passes/AutoFinalOnQueryPass.cpp | 2 +- src/Analyzer/Passes/AutoFinalOnQueryPass.h | 2 +- .../Passes/ComparisonTupleEliminationPass.cpp | 2 +- .../Passes/ComparisonTupleEliminationPass.h | 2 +- .../Passes/ConvertOrLikeChainPass.cpp | 2 +- src/Analyzer/Passes/ConvertOrLikeChainPass.h | 2 +- src/Analyzer/Passes/ConvertQueryToCNFPass.cpp | 2 +- src/Analyzer/Passes/ConvertQueryToCNFPass.h | 2 +- src/Analyzer/Passes/CountDistinctPass.cpp | 2 +- src/Analyzer/Passes/CountDistinctPass.h | 2 +- src/Analyzer/Passes/CrossToInnerJoinPass.cpp | 2 +- src/Analyzer/Passes/CrossToInnerJoinPass.h | 2 +- .../Passes/FunctionToSubcolumnsPass.cpp | 2 +- .../Passes/FunctionToSubcolumnsPass.h | 2 +- src/Analyzer/Passes/FuseFunctionsPass.cpp | 2 +- src/Analyzer/Passes/FuseFunctionsPass.h | 2 +- .../Passes/GroupingFunctionsResolvePass.cpp | 2 +- .../Passes/GroupingFunctionsResolvePass.h | 2 +- src/Analyzer/Passes/IfChainToMultiIfPass.cpp | 2 +- src/Analyzer/Passes/IfChainToMultiIfPass.h | 2 +- .../Passes/IfConstantConditionPass.cpp | 2 +- src/Analyzer/Passes/IfConstantConditionPass.h | 2 +- .../Passes/IfTransformStringsToEnumPass.cpp | 2 +- .../Passes/IfTransformStringsToEnumPass.h | 2 +- .../Passes/LogicalExpressionOptimizerPass.cpp | 2 +- .../Passes/LogicalExpressionOptimizerPass.h | 2 +- src/Analyzer/Passes/MultiIfToIfPass.cpp | 2 +- src/Analyzer/Passes/MultiIfToIfPass.h | 2 +- .../Passes/NormalizeCountVariantsPass.cpp | 2 +- .../Passes/NormalizeCountVariantsPass.h | 2 +- .../OptimizeGroupByFunctionKeysPass.cpp | 2 +- .../Passes/OptimizeGroupByFunctionKeysPass.h | 2 +- ...ptimizeRedundantFunctionsInOrderByPass.cpp | 2 +- .../OptimizeRedundantFunctionsInOrderByPass.h | 2 +- ...OrderByLimitByDuplicateEliminationPass.cpp | 2 +- .../OrderByLimitByDuplicateEliminationPass.h | 2 +- .../Passes/OrderByTupleEliminationPass.cpp | 2 +- .../Passes/OrderByTupleEliminationPass.h | 2 +- src/Analyzer/Passes/QueryAnalysisPass.cpp | 15 ++- src/Analyzer/Passes/QueryAnalysisPass.h | 2 +- .../RewriteAggregateFunctionWithIfPass.cpp | 2 +- .../RewriteAggregateFunctionWithIfPass.h | 2 +- .../Passes/ShardNumColumnToFunctionPass.cpp | 2 +- .../Passes/ShardNumColumnToFunctionPass.h | 2 +- src/Analyzer/Passes/SumIfToCountIfPass.cpp | 2 +- src/Analyzer/Passes/SumIfToCountIfPass.h | 2 +- .../UniqInjectiveFunctionsEliminationPass.cpp | 2 +- .../UniqInjectiveFunctionsEliminationPass.h | 2 +- src/Planner/PlannerActionsVisitor.cpp | 4 +- src/Storages/StorageDistributed.cpp | 4 +- src/Storages/StorageMerge.cpp | 121 +++++++++++++++--- src/Storages/StorageMerge.h | 9 +- 57 files changed, 177 insertions(+), 80 deletions(-) diff --git a/src/Analyzer/IQueryTreePass.h b/src/Analyzer/IQueryTreePass.h index 4293934c32d..d4499c3271c 100644 --- a/src/Analyzer/IQueryTreePass.h +++ b/src/Analyzer/IQueryTreePass.h @@ -31,7 +31,7 @@ public: virtual String getDescription() = 0; /// Run pass over query tree - virtual void run(QueryTreeNodePtr query_tree_node, ContextPtr context) = 0; + virtual void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) = 0; }; diff --git 
a/src/Analyzer/Passes/AggregateFunctionsArithmericOperationsPass.cpp b/src/Analyzer/Passes/AggregateFunctionsArithmericOperationsPass.cpp index 1476a66c892..2a69292ff78 100644 --- a/src/Analyzer/Passes/AggregateFunctionsArithmericOperationsPass.cpp +++ b/src/Analyzer/Passes/AggregateFunctionsArithmericOperationsPass.cpp @@ -201,7 +201,7 @@ private: } -void AggregateFunctionsArithmericOperationsPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void AggregateFunctionsArithmericOperationsPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { AggregateFunctionsArithmericOperationsVisitor visitor(std::move(context)); visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/AggregateFunctionsArithmericOperationsPass.h b/src/Analyzer/Passes/AggregateFunctionsArithmericOperationsPass.h index a89d2f87ad9..d510b62f9be 100644 --- a/src/Analyzer/Passes/AggregateFunctionsArithmericOperationsPass.h +++ b/src/Analyzer/Passes/AggregateFunctionsArithmericOperationsPass.h @@ -17,7 +17,7 @@ public: String getDescription() override { return "Extract arithmeric operations from aggregate functions."; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; diff --git a/src/Analyzer/Passes/ArrayExistsToHasPass.cpp b/src/Analyzer/Passes/ArrayExistsToHasPass.cpp index c0f958588f1..63d417cd570 100644 --- a/src/Analyzer/Passes/ArrayExistsToHasPass.cpp +++ b/src/Analyzer/Passes/ArrayExistsToHasPass.cpp @@ -92,7 +92,7 @@ public: } -void RewriteArrayExistsToHasPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void RewriteArrayExistsToHasPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { RewriteArrayExistsToHasVisitor visitor(context); visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/ArrayExistsToHasPass.h b/src/Analyzer/Passes/ArrayExistsToHasPass.h index 8f4623116e3..4795b61c625 100644 --- a/src/Analyzer/Passes/ArrayExistsToHasPass.h +++ b/src/Analyzer/Passes/ArrayExistsToHasPass.h @@ -20,7 +20,7 @@ public: String getDescription() override { return "Rewrite arrayExists(func, arr) functions to has(arr, elem) when logically equivalent"; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; } diff --git a/src/Analyzer/Passes/AutoFinalOnQueryPass.cpp b/src/Analyzer/Passes/AutoFinalOnQueryPass.cpp index 15326ca1dc8..ee9e1023949 100644 --- a/src/Analyzer/Passes/AutoFinalOnQueryPass.cpp +++ b/src/Analyzer/Passes/AutoFinalOnQueryPass.cpp @@ -67,7 +67,7 @@ private: } -void AutoFinalOnQueryPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void AutoFinalOnQueryPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { auto visitor = AutoFinalOnQueryPassVisitor(std::move(context)); visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/AutoFinalOnQueryPass.h b/src/Analyzer/Passes/AutoFinalOnQueryPass.h index 3489597108c..d595b98d349 100644 --- a/src/Analyzer/Passes/AutoFinalOnQueryPass.h +++ b/src/Analyzer/Passes/AutoFinalOnQueryPass.h @@ -25,7 +25,7 @@ public: return "Automatically applies final modifier to table expressions in queries if it is supported and if user level final setting is set"; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; } diff --git 
a/src/Analyzer/Passes/ComparisonTupleEliminationPass.cpp b/src/Analyzer/Passes/ComparisonTupleEliminationPass.cpp index 4e0562a2fe8..57920065513 100644 --- a/src/Analyzer/Passes/ComparisonTupleEliminationPass.cpp +++ b/src/Analyzer/Passes/ComparisonTupleEliminationPass.cpp @@ -201,7 +201,7 @@ private: } -void ComparisonTupleEliminationPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void ComparisonTupleEliminationPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { ComparisonTupleEliminationPassVisitor visitor(std::move(context)); visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/ComparisonTupleEliminationPass.h b/src/Analyzer/Passes/ComparisonTupleEliminationPass.h index 954a9d6a2f0..7f4245e2d95 100644 --- a/src/Analyzer/Passes/ComparisonTupleEliminationPass.h +++ b/src/Analyzer/Passes/ComparisonTupleEliminationPass.h @@ -17,7 +17,7 @@ public: String getDescription() override { return "Rewrite tuples comparison into equivalent comparison of tuples arguments"; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; diff --git a/src/Analyzer/Passes/ConvertOrLikeChainPass.cpp b/src/Analyzer/Passes/ConvertOrLikeChainPass.cpp index 7d7362fb742..0d2ddd20374 100644 --- a/src/Analyzer/Passes/ConvertOrLikeChainPass.cpp +++ b/src/Analyzer/Passes/ConvertOrLikeChainPass.cpp @@ -132,7 +132,7 @@ private: } -void ConvertOrLikeChainPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void ConvertOrLikeChainPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { auto or_function_resolver = FunctionFactory::instance().get("or", context); auto match_function_resolver = FunctionFactory::instance().get("multiMatchAny", context); diff --git a/src/Analyzer/Passes/ConvertOrLikeChainPass.h b/src/Analyzer/Passes/ConvertOrLikeChainPass.h index 0f734bfa73d..90bccaa0e8d 100644 --- a/src/Analyzer/Passes/ConvertOrLikeChainPass.h +++ b/src/Analyzer/Passes/ConvertOrLikeChainPass.h @@ -14,7 +14,7 @@ public: String getDescription() override { return "Replaces all the 'or's with {i}like to multiMatchAny"; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; } diff --git a/src/Analyzer/Passes/ConvertQueryToCNFPass.cpp b/src/Analyzer/Passes/ConvertQueryToCNFPass.cpp index 4d32c96b845..ecba2e28749 100644 --- a/src/Analyzer/Passes/ConvertQueryToCNFPass.cpp +++ b/src/Analyzer/Passes/ConvertQueryToCNFPass.cpp @@ -720,7 +720,7 @@ public: } -void ConvertLogicalExpressionToCNFPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void ConvertLogicalExpressionToCNFPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { const auto & settings = context->getSettingsRef(); if (!settings.convert_query_to_cnf) diff --git a/src/Analyzer/Passes/ConvertQueryToCNFPass.h b/src/Analyzer/Passes/ConvertQueryToCNFPass.h index 5ed874db006..60943c04d78 100644 --- a/src/Analyzer/Passes/ConvertQueryToCNFPass.h +++ b/src/Analyzer/Passes/ConvertQueryToCNFPass.h @@ -12,7 +12,7 @@ public: String getDescription() override { return "Convert logical expression to CNF and apply optimizations using constraints"; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; } diff --git a/src/Analyzer/Passes/CountDistinctPass.cpp b/src/Analyzer/Passes/CountDistinctPass.cpp 
index 945295f5cbc..eb2859020be 100644 --- a/src/Analyzer/Passes/CountDistinctPass.cpp +++ b/src/Analyzer/Passes/CountDistinctPass.cpp @@ -84,7 +84,7 @@ public: } -void CountDistinctPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void CountDistinctPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { CountDistinctVisitor visitor(std::move(context)); visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/CountDistinctPass.h b/src/Analyzer/Passes/CountDistinctPass.h index cac5033c98f..33728b0228c 100644 --- a/src/Analyzer/Passes/CountDistinctPass.h +++ b/src/Analyzer/Passes/CountDistinctPass.h @@ -20,7 +20,7 @@ public: return "Optimize single countDistinct into count over subquery"; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; diff --git a/src/Analyzer/Passes/CrossToInnerJoinPass.cpp b/src/Analyzer/Passes/CrossToInnerJoinPass.cpp index d4877d23f28..3283c163890 100644 --- a/src/Analyzer/Passes/CrossToInnerJoinPass.cpp +++ b/src/Analyzer/Passes/CrossToInnerJoinPass.cpp @@ -264,7 +264,7 @@ private: } -void CrossToInnerJoinPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void CrossToInnerJoinPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { CrossToInnerJoinVisitor visitor(std::move(context)); visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/CrossToInnerJoinPass.h b/src/Analyzer/Passes/CrossToInnerJoinPass.h index 127d26dc41d..b0437c562ac 100644 --- a/src/Analyzer/Passes/CrossToInnerJoinPass.h +++ b/src/Analyzer/Passes/CrossToInnerJoinPass.h @@ -22,7 +22,7 @@ public: return "Replace CROSS JOIN with INNER JOIN"; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; } diff --git a/src/Analyzer/Passes/FunctionToSubcolumnsPass.cpp b/src/Analyzer/Passes/FunctionToSubcolumnsPass.cpp index 696483862e0..1b04136e6a4 100644 --- a/src/Analyzer/Passes/FunctionToSubcolumnsPass.cpp +++ b/src/Analyzer/Passes/FunctionToSubcolumnsPass.cpp @@ -202,7 +202,7 @@ private: } -void FunctionToSubcolumnsPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void FunctionToSubcolumnsPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { FunctionToSubcolumnsVisitor visitor(context); visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/FunctionToSubcolumnsPass.h b/src/Analyzer/Passes/FunctionToSubcolumnsPass.h index 0e1d2583e7b..d4edcc5b922 100644 --- a/src/Analyzer/Passes/FunctionToSubcolumnsPass.h +++ b/src/Analyzer/Passes/FunctionToSubcolumnsPass.h @@ -24,7 +24,7 @@ public: String getDescription() override { return "Rewrite function to subcolumns, for example tupleElement(column, subcolumn) into column.subcolumn"; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; diff --git a/src/Analyzer/Passes/FuseFunctionsPass.cpp b/src/Analyzer/Passes/FuseFunctionsPass.cpp index 14082697955..ef87528964c 100644 --- a/src/Analyzer/Passes/FuseFunctionsPass.cpp +++ b/src/Analyzer/Passes/FuseFunctionsPass.cpp @@ -254,7 +254,7 @@ void tryFuseQuantiles(QueryTreeNodePtr query_tree_node, ContextPtr context) } -void FuseFunctionsPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void FuseFunctionsPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { 
tryFuseSumCountAvg(query_tree_node, context); tryFuseQuantiles(query_tree_node, context); diff --git a/src/Analyzer/Passes/FuseFunctionsPass.h b/src/Analyzer/Passes/FuseFunctionsPass.h index a92b77b1115..2fd85da4747 100644 --- a/src/Analyzer/Passes/FuseFunctionsPass.h +++ b/src/Analyzer/Passes/FuseFunctionsPass.h @@ -20,7 +20,7 @@ public: String getDescription() override { return "Replaces several calls of aggregate functions of the same family into one call"; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; } diff --git a/src/Analyzer/Passes/GroupingFunctionsResolvePass.cpp b/src/Analyzer/Passes/GroupingFunctionsResolvePass.cpp index 0cf5310a3ad..774014e5ffd 100644 --- a/src/Analyzer/Passes/GroupingFunctionsResolvePass.cpp +++ b/src/Analyzer/Passes/GroupingFunctionsResolvePass.cpp @@ -248,7 +248,7 @@ private: } -void GroupingFunctionsResolvePass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void GroupingFunctionsResolvePass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { GroupingFunctionsResolveVisitor visitor(std::move(context)); visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/GroupingFunctionsResolvePass.h b/src/Analyzer/Passes/GroupingFunctionsResolvePass.h index 070c8dd9389..cd932f76977 100644 --- a/src/Analyzer/Passes/GroupingFunctionsResolvePass.h +++ b/src/Analyzer/Passes/GroupingFunctionsResolvePass.h @@ -24,7 +24,7 @@ public: String getDescription() override { return "Resolve GROUPING functions based on GROUP BY modifiers"; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; diff --git a/src/Analyzer/Passes/IfChainToMultiIfPass.cpp b/src/Analyzer/Passes/IfChainToMultiIfPass.cpp index 1f97e012331..91a5709f142 100644 --- a/src/Analyzer/Passes/IfChainToMultiIfPass.cpp +++ b/src/Analyzer/Passes/IfChainToMultiIfPass.cpp @@ -73,7 +73,7 @@ private: } -void IfChainToMultiIfPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void IfChainToMultiIfPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { auto multi_if_function_ptr = FunctionFactory::instance().get("multiIf", context); IfChainToMultiIfPassVisitor visitor(std::move(multi_if_function_ptr), std::move(context)); diff --git a/src/Analyzer/Passes/IfChainToMultiIfPass.h b/src/Analyzer/Passes/IfChainToMultiIfPass.h index 43f3fb8831d..9e7335d93e4 100644 --- a/src/Analyzer/Passes/IfChainToMultiIfPass.h +++ b/src/Analyzer/Passes/IfChainToMultiIfPass.h @@ -18,7 +18,7 @@ public: String getDescription() override { return "Optimize if chain to multiIf"; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; diff --git a/src/Analyzer/Passes/IfConstantConditionPass.cpp b/src/Analyzer/Passes/IfConstantConditionPass.cpp index 6f9cfe482f1..35c6718f018 100644 --- a/src/Analyzer/Passes/IfConstantConditionPass.cpp +++ b/src/Analyzer/Passes/IfConstantConditionPass.cpp @@ -49,7 +49,7 @@ public: } -void IfConstantConditionPass::run(QueryTreeNodePtr query_tree_node, ContextPtr) +void IfConstantConditionPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr) { IfConstantConditionVisitor visitor; visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/IfConstantConditionPass.h b/src/Analyzer/Passes/IfConstantConditionPass.h index 7817e67aa5e..7548fc702bc 100644 --- 
a/src/Analyzer/Passes/IfConstantConditionPass.h +++ b/src/Analyzer/Passes/IfConstantConditionPass.h @@ -21,7 +21,7 @@ public: String getDescription() override { return "Optimize if, multiIf for constant condition."; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; diff --git a/src/Analyzer/Passes/IfTransformStringsToEnumPass.cpp b/src/Analyzer/Passes/IfTransformStringsToEnumPass.cpp index 562aff4cf05..32e3c3cda51 100644 --- a/src/Analyzer/Passes/IfTransformStringsToEnumPass.cpp +++ b/src/Analyzer/Passes/IfTransformStringsToEnumPass.cpp @@ -205,7 +205,7 @@ public: } -void IfTransformStringsToEnumPass::run(QueryTreeNodePtr query, ContextPtr context) +void IfTransformStringsToEnumPass::run(QueryTreeNodePtr & query, ContextPtr context) { ConvertStringsToEnumVisitor visitor(std::move(context)); visitor.visit(query); diff --git a/src/Analyzer/Passes/IfTransformStringsToEnumPass.h b/src/Analyzer/Passes/IfTransformStringsToEnumPass.h index a4a014967e0..522087aafae 100644 --- a/src/Analyzer/Passes/IfTransformStringsToEnumPass.h +++ b/src/Analyzer/Passes/IfTransformStringsToEnumPass.h @@ -33,7 +33,7 @@ public: String getDescription() override { return "Replaces string-type arguments in If and Transform to enum"; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; } diff --git a/src/Analyzer/Passes/LogicalExpressionOptimizerPass.cpp b/src/Analyzer/Passes/LogicalExpressionOptimizerPass.cpp index 13f8025f5ea..7e0b6b2f828 100644 --- a/src/Analyzer/Passes/LogicalExpressionOptimizerPass.cpp +++ b/src/Analyzer/Passes/LogicalExpressionOptimizerPass.cpp @@ -233,7 +233,7 @@ private: } }; -void LogicalExpressionOptimizerPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void LogicalExpressionOptimizerPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { LogicalExpressionOptimizerVisitor visitor(std::move(context)); visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/LogicalExpressionOptimizerPass.h b/src/Analyzer/Passes/LogicalExpressionOptimizerPass.h index 05c10ddc685..51d9968b48c 100644 --- a/src/Analyzer/Passes/LogicalExpressionOptimizerPass.h +++ b/src/Analyzer/Passes/LogicalExpressionOptimizerPass.h @@ -76,7 +76,7 @@ public: String getDescription() override { return "Transform equality chain to a single IN function or a constant if possible"; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; } diff --git a/src/Analyzer/Passes/MultiIfToIfPass.cpp b/src/Analyzer/Passes/MultiIfToIfPass.cpp index 4672351bcfb..5012aa7fa78 100644 --- a/src/Analyzer/Passes/MultiIfToIfPass.cpp +++ b/src/Analyzer/Passes/MultiIfToIfPass.cpp @@ -43,7 +43,7 @@ private: } -void MultiIfToIfPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void MultiIfToIfPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { auto if_function_ptr = FunctionFactory::instance().get("if", context); MultiIfToIfVisitor visitor(std::move(if_function_ptr), std::move(context)); diff --git a/src/Analyzer/Passes/MultiIfToIfPass.h b/src/Analyzer/Passes/MultiIfToIfPass.h index 2213f3713ed..e3c03913aaa 100644 --- a/src/Analyzer/Passes/MultiIfToIfPass.h +++ b/src/Analyzer/Passes/MultiIfToIfPass.h @@ -17,7 +17,7 @@ public: String getDescription() override { return "Optimize multiIf 
with single condition to if."; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; diff --git a/src/Analyzer/Passes/NormalizeCountVariantsPass.cpp b/src/Analyzer/Passes/NormalizeCountVariantsPass.cpp index d36be98751c..20b308c3af6 100644 --- a/src/Analyzer/Passes/NormalizeCountVariantsPass.cpp +++ b/src/Analyzer/Passes/NormalizeCountVariantsPass.cpp @@ -64,7 +64,7 @@ private: } -void NormalizeCountVariantsPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void NormalizeCountVariantsPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { NormalizeCountVariantsVisitor visitor(context); visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/NormalizeCountVariantsPass.h b/src/Analyzer/Passes/NormalizeCountVariantsPass.h index 78a114f4a85..6cf9f34619a 100644 --- a/src/Analyzer/Passes/NormalizeCountVariantsPass.h +++ b/src/Analyzer/Passes/NormalizeCountVariantsPass.h @@ -20,7 +20,7 @@ public: String getDescription() override { return "Optimize count(literal), sum(1) into count()."; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; diff --git a/src/Analyzer/Passes/OptimizeGroupByFunctionKeysPass.cpp b/src/Analyzer/Passes/OptimizeGroupByFunctionKeysPass.cpp index 5ed52f1210b..7c851d5fc35 100644 --- a/src/Analyzer/Passes/OptimizeGroupByFunctionKeysPass.cpp +++ b/src/Analyzer/Passes/OptimizeGroupByFunctionKeysPass.cpp @@ -130,7 +130,7 @@ private: } }; -void OptimizeGroupByFunctionKeysPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void OptimizeGroupByFunctionKeysPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { OptimizeGroupByFunctionKeysVisitor visitor(std::move(context)); visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/OptimizeGroupByFunctionKeysPass.h b/src/Analyzer/Passes/OptimizeGroupByFunctionKeysPass.h index 632960c45bb..fd5eadcb796 100644 --- a/src/Analyzer/Passes/OptimizeGroupByFunctionKeysPass.h +++ b/src/Analyzer/Passes/OptimizeGroupByFunctionKeysPass.h @@ -16,7 +16,7 @@ public: String getDescription() override { return "Eliminates functions of other keys in GROUP BY section."; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; } diff --git a/src/Analyzer/Passes/OptimizeRedundantFunctionsInOrderByPass.cpp b/src/Analyzer/Passes/OptimizeRedundantFunctionsInOrderByPass.cpp index c6d312d0ecf..b6cc50caffe 100644 --- a/src/Analyzer/Passes/OptimizeRedundantFunctionsInOrderByPass.cpp +++ b/src/Analyzer/Passes/OptimizeRedundantFunctionsInOrderByPass.cpp @@ -124,7 +124,7 @@ private: } -void OptimizeRedundantFunctionsInOrderByPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void OptimizeRedundantFunctionsInOrderByPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { OptimizeRedundantFunctionsInOrderByVisitor visitor(std::move(context)); visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/OptimizeRedundantFunctionsInOrderByPass.h b/src/Analyzer/Passes/OptimizeRedundantFunctionsInOrderByPass.h index 609a6360d27..4a63c78022b 100644 --- a/src/Analyzer/Passes/OptimizeRedundantFunctionsInOrderByPass.h +++ b/src/Analyzer/Passes/OptimizeRedundantFunctionsInOrderByPass.h @@ -17,7 +17,7 @@ public: String getDescription() override { return "If ORDER BY has argument x 
followed by f(x) transforms it to ORDER BY x."; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; } diff --git a/src/Analyzer/Passes/OrderByLimitByDuplicateEliminationPass.cpp b/src/Analyzer/Passes/OrderByLimitByDuplicateEliminationPass.cpp index 3632c41028b..26ca5984b49 100644 --- a/src/Analyzer/Passes/OrderByLimitByDuplicateEliminationPass.cpp +++ b/src/Analyzer/Passes/OrderByLimitByDuplicateEliminationPass.cpp @@ -70,7 +70,7 @@ private: } -void OrderByLimitByDuplicateEliminationPass::run(QueryTreeNodePtr query_tree_node, ContextPtr) +void OrderByLimitByDuplicateEliminationPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr) { OrderByLimitByDuplicateEliminationVisitor visitor; visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/OrderByLimitByDuplicateEliminationPass.h b/src/Analyzer/Passes/OrderByLimitByDuplicateEliminationPass.h index 11a025af5b9..de5e1898a4c 100644 --- a/src/Analyzer/Passes/OrderByLimitByDuplicateEliminationPass.h +++ b/src/Analyzer/Passes/OrderByLimitByDuplicateEliminationPass.h @@ -20,7 +20,7 @@ public: String getDescription() override { return "Remove duplicate columns from ORDER BY, LIMIT BY."; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; diff --git a/src/Analyzer/Passes/OrderByTupleEliminationPass.cpp b/src/Analyzer/Passes/OrderByTupleEliminationPass.cpp index f70ec27ba5d..7c106082124 100644 --- a/src/Analyzer/Passes/OrderByTupleEliminationPass.cpp +++ b/src/Analyzer/Passes/OrderByTupleEliminationPass.cpp @@ -50,7 +50,7 @@ public: } -void OrderByTupleEliminationPass::run(QueryTreeNodePtr query_tree_node, ContextPtr) +void OrderByTupleEliminationPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr) { OrderByTupleEliminationVisitor visitor; visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/OrderByTupleEliminationPass.h b/src/Analyzer/Passes/OrderByTupleEliminationPass.h index 5665561e227..45c8a756795 100644 --- a/src/Analyzer/Passes/OrderByTupleEliminationPass.h +++ b/src/Analyzer/Passes/OrderByTupleEliminationPass.h @@ -17,7 +17,7 @@ public: String getDescription() override { return "Remove tuple from ORDER BY."; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; diff --git a/src/Analyzer/Passes/QueryAnalysisPass.cpp b/src/Analyzer/Passes/QueryAnalysisPass.cpp index c454ad9f84f..1a76bc762a4 100644 --- a/src/Analyzer/Passes/QueryAnalysisPass.cpp +++ b/src/Analyzer/Passes/QueryAnalysisPass.cpp @@ -77,6 +77,8 @@ #include #include #include +#include +#include namespace ProfileEvents { @@ -1056,7 +1058,7 @@ private: class QueryAnalyzer { public: - void resolve(QueryTreeNodePtr node, const QueryTreeNodePtr & table_expression, ContextPtr context) + void resolve(QueryTreeNodePtr & node, const QueryTreeNodePtr & table_expression, ContextPtr context) { IdentifierResolveScope scope(node, nullptr /*parent_scope*/); @@ -1097,6 +1099,7 @@ public: { if (table_expression) { + LOG_DEBUG(&Poco::Logger::get("resolve"), "Table expression: {}", table_expression->dumpTree()); scope.expression_join_tree_node = table_expression; validateTableExpressionModifiers(scope.expression_join_tree_node, scope); initializeTableExpressionData(scope.expression_join_tree_node, scope); @@ -1106,6 +1109,7 @@ public: resolveExpressionNodeList(node, 
scope, false /*allow_lambda_expression*/, false /*allow_table_expression*/); else resolveExpressionNode(node, scope, false /*allow_lambda_expression*/, false /*allow_table_expression*/); + LOG_DEBUG(&Poco::Logger::get("resolve"), "Result: {}", node->dumpTree()); break; } @@ -2677,6 +2681,7 @@ QueryTreeNodePtr QueryAnalyzer::tryResolveIdentifierFromAliases(const Identifier */ QueryTreeNodePtr QueryAnalyzer::tryResolveIdentifierFromTableColumns(const IdentifierLookup & identifier_lookup, IdentifierResolveScope & scope) { + LOG_DEBUG(&Poco::Logger::get("tryResolveIdentifierFromTableColumns"), "{} {}", scope.column_name_to_column_node.size(), !identifier_lookup.isExpressionLookup()); if (scope.column_name_to_column_node.empty() || !identifier_lookup.isExpressionLookup()) return {}; @@ -2836,11 +2841,14 @@ QueryTreeNodePtr QueryAnalyzer::tryResolveIdentifierFromTableExpression(const Id QueryTreeNodePtr result_expression; bool match_full_identifier = false; + LOG_DEBUG(&Poco::Logger::get("resolve_identifier_from_storage_or_throw"), "Looking for id: {}", identifier_without_column_qualifier.getFullName()); + auto it = table_expression_data.column_name_to_column_node.find(identifier_without_column_qualifier.getFullName()); if (it != table_expression_data.column_name_to_column_node.end()) { match_full_identifier = true; result_expression = it->second; + LOG_DEBUG(&Poco::Logger::get("resolve_identifier_from_storage_or_throw"), "Found: {}", result_expression->dumpTree()); } else { @@ -5389,6 +5397,7 @@ ProjectionNames QueryAnalyzer::resolveExpressionNode(QueryTreeNodePtr & node, Id auto unresolved_identifier = identifier_node.getIdentifier(); auto resolve_identifier_expression_result = tryResolveIdentifier({unresolved_identifier, IdentifierLookupContext::EXPRESSION}, scope); auto resolved_identifier_node = resolve_identifier_expression_result.resolved_identifier; + LOG_DEBUG(&Poco::Logger::get("resolveExpressionNode"), "Resolved: {}", resolved_identifier_node ? resolved_identifier_node->dumpTree() : "Not resolved"); if (resolved_identifier_node && result_projection_names.empty() && (resolve_identifier_expression_result.isResolvedFromJoinTree() || resolve_identifier_expression_result.isResolvedFromExpressionArguments())) @@ -5470,6 +5479,7 @@ ProjectionNames QueryAnalyzer::resolveExpressionNode(QueryTreeNodePtr & node, Id } node = std::move(resolved_identifier_node); + LOG_DEBUG(&Poco::Logger::get("resolveExpressionNode"), "Result node: {}", node ? 
node->dumpTree() : "Not resolved"); if (node->getNodeType() == QueryTreeNodeType::LIST) { @@ -6173,6 +6183,7 @@ void QueryAnalyzer::initializeTableExpressionData(const QueryTreeNodePtr & table table_expression_data.should_qualify_columns = false; } + LOG_DEBUG(&Poco::Logger::get("Analyzer"), "Table data: {}", table_expression_data.dump()); scope.table_expression_node_to_data.emplace(table_expression_node, std::move(table_expression_data)); } @@ -7152,7 +7163,7 @@ QueryAnalysisPass::QueryAnalysisPass(QueryTreeNodePtr table_expression_) : table_expression(std::move(table_expression_)) {} -void QueryAnalysisPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void QueryAnalysisPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { QueryAnalyzer analyzer; analyzer.resolve(query_tree_node, table_expression, context); diff --git a/src/Analyzer/Passes/QueryAnalysisPass.h b/src/Analyzer/Passes/QueryAnalysisPass.h index fa8778ebf76..5d335d3e712 100644 --- a/src/Analyzer/Passes/QueryAnalysisPass.h +++ b/src/Analyzer/Passes/QueryAnalysisPass.h @@ -89,7 +89,7 @@ public: return "Resolve type for each query expression. Replace identifiers, matchers with query expressions. Perform constant folding. Evaluate scalar subqueries."; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; private: QueryTreeNodePtr table_expression; diff --git a/src/Analyzer/Passes/RewriteAggregateFunctionWithIfPass.cpp b/src/Analyzer/Passes/RewriteAggregateFunctionWithIfPass.cpp index de264948d4c..2fe5a89578b 100644 --- a/src/Analyzer/Passes/RewriteAggregateFunctionWithIfPass.cpp +++ b/src/Analyzer/Passes/RewriteAggregateFunctionWithIfPass.cpp @@ -108,7 +108,7 @@ private: } -void RewriteAggregateFunctionWithIfPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void RewriteAggregateFunctionWithIfPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { RewriteAggregateFunctionWithIfVisitor visitor(context); visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/RewriteAggregateFunctionWithIfPass.h b/src/Analyzer/Passes/RewriteAggregateFunctionWithIfPass.h index be8ad3ac34d..0a2fc1ba423 100644 --- a/src/Analyzer/Passes/RewriteAggregateFunctionWithIfPass.h +++ b/src/Analyzer/Passes/RewriteAggregateFunctionWithIfPass.h @@ -20,7 +20,7 @@ public: return "Rewrite aggregate functions with if expression as argument when logically equivalent"; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; diff --git a/src/Analyzer/Passes/ShardNumColumnToFunctionPass.cpp b/src/Analyzer/Passes/ShardNumColumnToFunctionPass.cpp index b28816e8ff3..c273aecc9b5 100644 --- a/src/Analyzer/Passes/ShardNumColumnToFunctionPass.cpp +++ b/src/Analyzer/Passes/ShardNumColumnToFunctionPass.cpp @@ -58,7 +58,7 @@ public: } -void ShardNumColumnToFunctionPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void ShardNumColumnToFunctionPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { ShardNumColumnToFunctionVisitor visitor(context); visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/ShardNumColumnToFunctionPass.h b/src/Analyzer/Passes/ShardNumColumnToFunctionPass.h index 71a038bcf39..248f4e29bbe 100644 --- a/src/Analyzer/Passes/ShardNumColumnToFunctionPass.h +++ b/src/Analyzer/Passes/ShardNumColumnToFunctionPass.h @@ -17,7 +17,7 @@ public: String getDescription() 
override { return "Rewrite _shard_num column into shardNum() function"; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; diff --git a/src/Analyzer/Passes/SumIfToCountIfPass.cpp b/src/Analyzer/Passes/SumIfToCountIfPass.cpp index d55af278152..04d6c134d10 100644 --- a/src/Analyzer/Passes/SumIfToCountIfPass.cpp +++ b/src/Analyzer/Passes/SumIfToCountIfPass.cpp @@ -180,7 +180,7 @@ private: } -void SumIfToCountIfPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void SumIfToCountIfPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { SumIfToCountIfVisitor visitor(context); visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/SumIfToCountIfPass.h b/src/Analyzer/Passes/SumIfToCountIfPass.h index f3ba47f1c2c..439d80c6306 100644 --- a/src/Analyzer/Passes/SumIfToCountIfPass.h +++ b/src/Analyzer/Passes/SumIfToCountIfPass.h @@ -23,7 +23,7 @@ public: String getDescription() override { return "Rewrite sum(if) and sumIf into countIf"; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; diff --git a/src/Analyzer/Passes/UniqInjectiveFunctionsEliminationPass.cpp b/src/Analyzer/Passes/UniqInjectiveFunctionsEliminationPass.cpp index 5c4484457e8..e256934010d 100644 --- a/src/Analyzer/Passes/UniqInjectiveFunctionsEliminationPass.cpp +++ b/src/Analyzer/Passes/UniqInjectiveFunctionsEliminationPass.cpp @@ -87,7 +87,7 @@ public: } -void UniqInjectiveFunctionsEliminationPass::run(QueryTreeNodePtr query_tree_node, ContextPtr context) +void UniqInjectiveFunctionsEliminationPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { UniqInjectiveFunctionsEliminationVisitor visitor(std::move(context)); visitor.visit(query_tree_node); diff --git a/src/Analyzer/Passes/UniqInjectiveFunctionsEliminationPass.h b/src/Analyzer/Passes/UniqInjectiveFunctionsEliminationPass.h index a0f07dfb7b5..c143fe2c39c 100644 --- a/src/Analyzer/Passes/UniqInjectiveFunctionsEliminationPass.h +++ b/src/Analyzer/Passes/UniqInjectiveFunctionsEliminationPass.h @@ -17,7 +17,7 @@ public: String getDescription() override { return "Remove injective functions from uniq functions arguments."; } - void run(QueryTreeNodePtr query_tree_node, ContextPtr context) override; + void run(QueryTreeNodePtr & query_tree_node, ContextPtr context) override; }; diff --git a/src/Planner/PlannerActionsVisitor.cpp b/src/Planner/PlannerActionsVisitor.cpp index c64d82299ca..e9fa72f925d 100644 --- a/src/Planner/PlannerActionsVisitor.cpp +++ b/src/Planner/PlannerActionsVisitor.cpp @@ -494,8 +494,8 @@ PlannerActionsVisitorImpl::NodeNameAndNodeMinLevel PlannerActionsVisitorImpl::vi return visitFunction(node); throw Exception(ErrorCodes::UNSUPPORTED_METHOD, - "Expected column, constant, function. Actual {}", - node->formatASTForErrorMessage()); + "Expected column, constant, function. 
Actual {} with type: {}", + node->formatASTForErrorMessage(), node_type); } PlannerActionsVisitorImpl::NodeNameAndNodeMinLevel PlannerActionsVisitorImpl::visitColumn(const QueryTreeNodePtr & node) diff --git a/src/Storages/StorageDistributed.cpp b/src/Storages/StorageDistributed.cpp index b91ad0b963a..9f9f0fda9e2 100644 --- a/src/Storages/StorageDistributed.cpp +++ b/src/Storages/StorageDistributed.cpp @@ -30,6 +30,7 @@ #include #include #include +#include "Analyzer/IQueryTreeNode.h" #include #include @@ -937,7 +938,8 @@ QueryTreeNodePtr buildQueryTreeDistributed(SelectQueryInfo & query_info, table_function_node->setTableExpressionModifiers(*table_expression_modifiers); QueryAnalysisPass query_analysis_pass; - query_analysis_pass.run(table_function_node, query_context); + QueryTreeNodePtr node = table_function_node; + query_analysis_pass.run(node, query_context); replacement_table_expression = std::move(table_function_node); } diff --git a/src/Storages/StorageMerge.cpp b/src/Storages/StorageMerge.cpp index b0ed242d14d..a49155ac2d9 100644 --- a/src/Storages/StorageMerge.cpp +++ b/src/Storages/StorageMerge.cpp @@ -27,9 +27,18 @@ #include #include #include +#include "Common/logger_useful.h" #include #include +#include "Analyzer/ColumnNode.h" +#include "Analyzer/IQueryTreeNode.h" +#include "Analyzer/Identifier.h" +#include "Analyzer/IdentifierNode.h" +#include "Analyzer/Passes/QueryAnalysisPass.h" +#include "Analyzer/QueryTreeBuilder.h" +#include "Core/NamesAndTypes.h" #include "DataTypes/IDataType.h" +#include "Planner/PlannerActionsVisitor.h" #include #include #include @@ -42,6 +51,7 @@ #include #include #include +#include namespace @@ -464,8 +474,8 @@ void ReadFromMerge::initializePipeline(QueryPipelineBuilder & pipeline, const Bu auto storage_metadata_snapshot = storage->getInMemoryMetadataPtr(); auto nested_storage_snaphsot = storage->getStorageSnapshot(storage_metadata_snapshot, context); - auto modified_query_info = getModifiedQueryInfo(query_info, context, table, nested_storage_snaphsot); Names column_names_as_aliases; + auto modified_query_info = getModifiedQueryInfo(context, table, nested_storage_snaphsot, column_names_as_aliases); if (!context->getSettingsRef().allow_experimental_analyzer) { @@ -553,10 +563,10 @@ void ReadFromMerge::initializePipeline(QueryPipelineBuilder & pipeline, const Bu pipeline.addResources(std::move(resources)); } -SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const SelectQueryInfo & query_info, - const ContextPtr & modified_context, +SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const ContextPtr & modified_context, const StorageWithLockAndName & storage_with_lock_and_name, - const StorageSnapshotPtr & storage_snapshot) + const StorageSnapshotPtr & storage_snapshot, + Names & column_names_as_aliases) const { const auto & [database_name, storage, storage_lock, table_name] = storage_with_lock_and_name; const StorageID current_storage_id = storage->getStorageID(); @@ -586,6 +596,47 @@ SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const SelectQueryInfo & quer if (!storage_snapshot->tryGetColumn(get_column_options, "_database")) column_name_to_node.emplace("_database", std::make_shared(current_storage_id.database_name)); + auto storage_columns = storage_snapshot->metadata->getColumns(); + + bool with_aliases = /* common_processed_stage == QueryProcessingStage::FetchColumns && */ !storage_columns.getAliases().empty(); + if (with_aliases) + { + auto filter_actions_dag = std::make_shared(); + for (const auto & column : column_names) + { + const 
auto column_default = storage_columns.getDefault(column); + bool is_alias = column_default && column_default->kind == ColumnDefaultKind::Alias; + + QueryTreeNodePtr column_node; + + if (is_alias) + { + column_node = buildQueryTree(column_default->expression, modified_context); + + LOG_DEBUG(&Poco::Logger::get("getModifiedQueryInfo"), "QT before: {}\n{}", column_node->dumpTree(), modified_query_info.table_expression->dumpTree()); + + column_node->setAlias(column); + + QueryAnalysisPass query_analysis_pass(modified_query_info.table_expression); + query_analysis_pass.run(column_node, modified_context); + + LOG_DEBUG(&Poco::Logger::get("getModifiedQueryInfo"), "QT after: {}", column_node->dumpTree()); + + column_name_to_node.emplace(column, column_node); + } + else + { + column_node = std::make_shared(NameAndTypePair{column, storage_columns.getColumn(get_column_options, column).type }, modified_query_info.table_expression); + } + + + PlannerActionsVisitor actions_visitor(modified_query_info.planner_context, false /*use_column_identifier_as_action_node_name*/); + actions_visitor.visit(filter_actions_dag, column_node); + } + column_names_as_aliases = filter_actions_dag->getRequiredColumnsNames(); + LOG_DEBUG(&Poco::Logger::get("getModifiedQueryInfo"), "Required names: {}", toString(column_names_as_aliases)); + } + if (!column_name_to_node.empty()) { replaceColumns(modified_query_info.query_tree, @@ -594,6 +645,7 @@ SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const SelectQueryInfo & quer } modified_query_info.query = queryNodeToSelectQuery(modified_query_info.query_tree); + LOG_DEBUG(&Poco::Logger::get("getModifiedQueryInfo"), "Modified query: {}", modified_query_info.query->formatForLogging()); } else { @@ -640,6 +692,8 @@ QueryPipelineBuilderPtr ReadFromMerge::createSources( modified_select.setFinal(); } + LOG_DEBUG(&Poco::Logger::get("createSources"), "real_column_names: {}", toString(real_column_names)); + bool allow_experimental_analyzer = modified_context->getSettingsRef().allow_experimental_analyzer; auto storage_stage = storage->getQueryProcessingStage(modified_context, @@ -783,7 +837,7 @@ QueryPipelineBuilderPtr ReadFromMerge::createSources( /// Subordinary tables could have different but convertible types, like numeric types of different width. /// We must return streams with structure equals to structure of Merge table. 
- convertingSourceStream(header, storage_snapshot->metadata, aliases, modified_context, *builder, processed_stage); + convertingSourceStream(header, modified_query_info, storage_snapshot->metadata, aliases, modified_context, *builder, processed_stage); } return builder; @@ -957,9 +1011,10 @@ void StorageMerge::alter( void ReadFromMerge::convertingSourceStream( const Block & header, + SelectQueryInfo & modified_query_info, const StorageMetadataPtr & metadata_snapshot, const Aliases & aliases, - ContextPtr local_context, + ContextMutablePtr local_context, QueryPipelineBuilder & builder, const QueryProcessingStage::Enum & processed_stage) { @@ -968,21 +1023,49 @@ void ReadFromMerge::convertingSourceStream( auto storage_sample_block = metadata_snapshot->getSampleBlock(); auto pipe_columns = builder.getHeader().getNamesAndTypesList(); - for (const auto & alias : aliases) + if (local_context->getSettingsRef().allow_experimental_analyzer) { - pipe_columns.emplace_back(NameAndTypePair(alias.name, alias.type)); - ASTPtr expr = alias.expression; - auto syntax_result = TreeRewriter(local_context).analyze(expr, pipe_columns); - auto expression_analyzer = ExpressionAnalyzer{alias.expression, syntax_result, local_context}; - - auto dag = std::make_shared(pipe_columns); - auto actions_dag = expression_analyzer.getActionsDAG(true, false); - auto actions = std::make_shared(actions_dag, ExpressionActionsSettings::fromContext(local_context, CompileExpressions::yes)); - - builder.addSimpleTransform([&](const Block & stream_header) + for (const auto & alias : aliases) { - return std::make_shared(stream_header, actions); - }); + pipe_columns.emplace_back(NameAndTypePair(alias.name, alias.type)); + + auto actions_dag = std::make_shared(); + + QueryTreeNodePtr query_tree = buildQueryTree(alias.expression, local_context); + query_tree->setAlias(alias.name); + + QueryAnalysisPass query_analysis_pass(modified_query_info.table_expression); + query_analysis_pass.run(query_tree, local_context); + + PlannerActionsVisitor actions_visitor(modified_query_info.planner_context, false /*use_column_identifier_as_action_node_name*/); + actions_visitor.visit(actions_dag, query_tree); + + auto actions = std::make_shared(actions_dag, ExpressionActionsSettings::fromContext(local_context, CompileExpressions::yes)); + + builder.addSimpleTransform([&](const Block & stream_header) + { + return std::make_shared(stream_header, actions); + }); + } + } + else + { + for (const auto & alias : aliases) + { + pipe_columns.emplace_back(NameAndTypePair(alias.name, alias.type)); + ASTPtr expr = alias.expression; + auto syntax_result = TreeRewriter(local_context).analyze(expr, pipe_columns); + auto expression_analyzer = ExpressionAnalyzer{alias.expression, syntax_result, local_context}; + + auto dag = std::make_shared(pipe_columns); + auto actions_dag = expression_analyzer.getActionsDAG(true, false); + auto actions = std::make_shared(actions_dag, ExpressionActionsSettings::fromContext(local_context, CompileExpressions::yes)); + + builder.addSimpleTransform([&](const Block & stream_header) + { + return std::make_shared(stream_header, actions); + }); + } } ActionsDAG::MatchColumnsMode convert_actions_match_columns_mode = ActionsDAG::MatchColumnsMode::Name; diff --git a/src/Storages/StorageMerge.h b/src/Storages/StorageMerge.h index babf0dd92e8..739d6831f6f 100644 --- a/src/Storages/StorageMerge.h +++ b/src/Storages/StorageMerge.h @@ -177,10 +177,10 @@ private: using Aliases = std::vector; - static SelectQueryInfo getModifiedQueryInfo(const 
SelectQueryInfo & query_info, - const ContextPtr & modified_context, + SelectQueryInfo getModifiedQueryInfo(const ContextPtr & modified_context, const StorageWithLockAndName & storage_with_lock_and_name, - const StorageSnapshotPtr & storage_snapshot); + const StorageSnapshotPtr & storage_snapshot, + Names & column_names_as_aliases) const; QueryPipelineBuilderPtr createSources( const StorageSnapshotPtr & storage_snapshot, @@ -197,9 +197,10 @@ private: static void convertingSourceStream( const Block & header, + SelectQueryInfo & modified_query_info, const StorageMetadataPtr & metadata_snapshot, const Aliases & aliases, - ContextPtr context, + ContextMutablePtr context, QueryPipelineBuilder & builder, const QueryProcessingStage::Enum & processed_stage); }; From fc9ee3eb4e1e4c4b145bc39bc7ce507cf05b9d1d Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Tue, 13 Jun 2023 15:01:31 +0000 Subject: [PATCH 0002/1081] Correctly build the ActionsDAG --- src/Storages/StorageMerge.cpp | 28 +++++++++++++++++++++------- src/Storages/StorageMerge.h | 3 ++- 2 files changed, 23 insertions(+), 8 deletions(-) diff --git a/src/Storages/StorageMerge.cpp b/src/Storages/StorageMerge.cpp index a49155ac2d9..d036eaa9f25 100644 --- a/src/Storages/StorageMerge.cpp +++ b/src/Storages/StorageMerge.cpp @@ -475,7 +475,7 @@ void ReadFromMerge::initializePipeline(QueryPipelineBuilder & pipeline, const Bu auto nested_storage_snaphsot = storage->getStorageSnapshot(storage_metadata_snapshot, context); Names column_names_as_aliases; - auto modified_query_info = getModifiedQueryInfo(context, table, nested_storage_snaphsot, column_names_as_aliases); + auto modified_query_info = getModifiedQueryInfo(context, table, nested_storage_snaphsot, column_names_as_aliases, aliases); if (!context->getSettingsRef().allow_experimental_analyzer) { @@ -566,7 +566,8 @@ void ReadFromMerge::initializePipeline(QueryPipelineBuilder & pipeline, const Bu SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const ContextPtr & modified_context, const StorageWithLockAndName & storage_with_lock_and_name, const StorageSnapshotPtr & storage_snapshot, - Names & column_names_as_aliases) const + Names & column_names_as_aliases, + Aliases & aliases) const { const auto & [database_name, storage, storage_lock, table_name] = storage_with_lock_and_name; const StorageID current_storage_id = storage->getStorageID(); @@ -611,18 +612,23 @@ SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const ContextPtr & modified_ if (is_alias) { - column_node = buildQueryTree(column_default->expression, modified_context); + // column_node = buildQueryTree(column_default->expression, modified_context); + column_node = std::make_shared(Identifier{column}); LOG_DEBUG(&Poco::Logger::get("getModifiedQueryInfo"), "QT before: {}\n{}", column_node->dumpTree(), modified_query_info.table_expression->dumpTree()); - column_node->setAlias(column); - QueryAnalysisPass query_analysis_pass(modified_query_info.table_expression); query_analysis_pass.run(column_node, modified_context); LOG_DEBUG(&Poco::Logger::get("getModifiedQueryInfo"), "QT after: {}", column_node->dumpTree()); + auto * resolved_column = column_node->as(); + if (!resolved_column || !resolved_column->getExpression()) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Alias column is not resolved"); + + column_node = resolved_column->getExpression(); column_name_to_node.emplace(column, column_node); + aliases.push_back({ .name = column, .type = resolved_column->getResultType(), .expression = column_node->toAST() }); } else { @@ -634,6 
+640,9 @@ SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const ContextPtr & modified_ actions_visitor.visit(filter_actions_dag, column_node); } column_names_as_aliases = filter_actions_dag->getRequiredColumnsNames(); + if (column_names_as_aliases.empty()) + column_names_as_aliases.push_back(ExpressionActions::getSmallestColumn(storage_snapshot->metadata->getColumns().getAllPhysical()).name); + LOG_DEBUG(&Poco::Logger::get("getModifiedQueryInfo"), "Required names: {}", toString(column_names_as_aliases)); } @@ -1029,7 +1038,7 @@ void ReadFromMerge::convertingSourceStream( { pipe_columns.emplace_back(NameAndTypePair(alias.name, alias.type)); - auto actions_dag = std::make_shared(); + auto actions_dag = std::make_shared(pipe_columns); QueryTreeNodePtr query_tree = buildQueryTree(alias.expression, local_context); query_tree->setAlias(alias.name); @@ -1038,7 +1047,12 @@ void ReadFromMerge::convertingSourceStream( query_analysis_pass.run(query_tree, local_context); PlannerActionsVisitor actions_visitor(modified_query_info.planner_context, false /*use_column_identifier_as_action_node_name*/); - actions_visitor.visit(actions_dag, query_tree); + const auto & nodes = actions_visitor.visit(actions_dag, query_tree); + + if (nodes.size() != 1) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Expected to have 1 output but got {}", nodes.size()); + + actions_dag->addOrReplaceInOutputs(actions_dag->addAlias(*nodes.front(), alias.name)); auto actions = std::make_shared(actions_dag, ExpressionActionsSettings::fromContext(local_context, CompileExpressions::yes)); diff --git a/src/Storages/StorageMerge.h b/src/Storages/StorageMerge.h index 739d6831f6f..987869e5de3 100644 --- a/src/Storages/StorageMerge.h +++ b/src/Storages/StorageMerge.h @@ -180,7 +180,8 @@ private: SelectQueryInfo getModifiedQueryInfo(const ContextPtr & modified_context, const StorageWithLockAndName & storage_with_lock_and_name, const StorageSnapshotPtr & storage_snapshot, - Names & column_names_as_aliases) const; + Names & column_names_as_aliases, + Aliases & aliases) const; QueryPipelineBuilderPtr createSources( const StorageSnapshotPtr & storage_snapshot, From 55b81a5a5e7ad73a3e53aee0d0b83731ff8e76ed Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Tue, 13 Jun 2023 23:13:18 +0000 Subject: [PATCH 0003/1081] Fix style --- src/Storages/StorageMerge.cpp | 1 + 1 file changed, 1 insertion(+) diff --git a/src/Storages/StorageMerge.cpp b/src/Storages/StorageMerge.cpp index d036eaa9f25..e2a27d4e20e 100644 --- a/src/Storages/StorageMerge.cpp +++ b/src/Storages/StorageMerge.cpp @@ -80,6 +80,7 @@ namespace DB namespace ErrorCodes { + extern const int LOGICAL_ERROR; extern const int BAD_ARGUMENTS; extern const int NOT_IMPLEMENTED; extern const int ILLEGAL_PREWHERE; From 6489922dc19a0fda86bdcc8e08c108812dc4aebf Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Fri, 16 Jun 2023 18:49:59 +0000 Subject: [PATCH 0004/1081] Fix for column aliases that use other aliases --- src/Analyzer/Passes/QueryAnalysisPass.cpp | 9 ------ src/Storages/StorageMerge.cpp | 38 ++++++++++++++++++++--- 2 files changed, 33 insertions(+), 14 deletions(-) diff --git a/src/Analyzer/Passes/QueryAnalysisPass.cpp b/src/Analyzer/Passes/QueryAnalysisPass.cpp index 1a76bc762a4..309f067c4c0 100644 --- a/src/Analyzer/Passes/QueryAnalysisPass.cpp +++ b/src/Analyzer/Passes/QueryAnalysisPass.cpp @@ -1099,7 +1099,6 @@ public: { if (table_expression) { - LOG_DEBUG(&Poco::Logger::get("resolve"), "Table expression: {}", table_expression->dumpTree()); scope.expression_join_tree_node = 
table_expression; validateTableExpressionModifiers(scope.expression_join_tree_node, scope); initializeTableExpressionData(scope.expression_join_tree_node, scope); @@ -1109,7 +1108,6 @@ public: resolveExpressionNodeList(node, scope, false /*allow_lambda_expression*/, false /*allow_table_expression*/); else resolveExpressionNode(node, scope, false /*allow_lambda_expression*/, false /*allow_table_expression*/); - LOG_DEBUG(&Poco::Logger::get("resolve"), "Result: {}", node->dumpTree()); break; } @@ -2681,7 +2679,6 @@ QueryTreeNodePtr QueryAnalyzer::tryResolveIdentifierFromAliases(const Identifier */ QueryTreeNodePtr QueryAnalyzer::tryResolveIdentifierFromTableColumns(const IdentifierLookup & identifier_lookup, IdentifierResolveScope & scope) { - LOG_DEBUG(&Poco::Logger::get("tryResolveIdentifierFromTableColumns"), "{} {}", scope.column_name_to_column_node.size(), !identifier_lookup.isExpressionLookup()); if (scope.column_name_to_column_node.empty() || !identifier_lookup.isExpressionLookup()) return {}; @@ -2841,14 +2838,11 @@ QueryTreeNodePtr QueryAnalyzer::tryResolveIdentifierFromTableExpression(const Id QueryTreeNodePtr result_expression; bool match_full_identifier = false; - LOG_DEBUG(&Poco::Logger::get("resolve_identifier_from_storage_or_throw"), "Looking for id: {}", identifier_without_column_qualifier.getFullName()); - auto it = table_expression_data.column_name_to_column_node.find(identifier_without_column_qualifier.getFullName()); if (it != table_expression_data.column_name_to_column_node.end()) { match_full_identifier = true; result_expression = it->second; - LOG_DEBUG(&Poco::Logger::get("resolve_identifier_from_storage_or_throw"), "Found: {}", result_expression->dumpTree()); } else { @@ -5397,7 +5391,6 @@ ProjectionNames QueryAnalyzer::resolveExpressionNode(QueryTreeNodePtr & node, Id auto unresolved_identifier = identifier_node.getIdentifier(); auto resolve_identifier_expression_result = tryResolveIdentifier({unresolved_identifier, IdentifierLookupContext::EXPRESSION}, scope); auto resolved_identifier_node = resolve_identifier_expression_result.resolved_identifier; - LOG_DEBUG(&Poco::Logger::get("resolveExpressionNode"), "Resolved: {}", resolved_identifier_node ? resolved_identifier_node->dumpTree() : "Not resolved"); if (resolved_identifier_node && result_projection_names.empty() && (resolve_identifier_expression_result.isResolvedFromJoinTree() || resolve_identifier_expression_result.isResolvedFromExpressionArguments())) @@ -5479,7 +5472,6 @@ ProjectionNames QueryAnalyzer::resolveExpressionNode(QueryTreeNodePtr & node, Id } node = std::move(resolved_identifier_node); - LOG_DEBUG(&Poco::Logger::get("resolveExpressionNode"), "Result node: {}", node ? 
node->dumpTree() : "Not resolved"); if (node->getNodeType() == QueryTreeNodeType::LIST) { @@ -6183,7 +6175,6 @@ void QueryAnalyzer::initializeTableExpressionData(const QueryTreeNodePtr & table table_expression_data.should_qualify_columns = false; } - LOG_DEBUG(&Poco::Logger::get("Analyzer"), "Table data: {}", table_expression_data.dump()); scope.table_expression_node_to_data.emplace(table_expression_node, std::move(table_expression_data)); } diff --git a/src/Storages/StorageMerge.cpp b/src/Storages/StorageMerge.cpp index e2a27d4e20e..13548a84826 100644 --- a/src/Storages/StorageMerge.cpp +++ b/src/Storages/StorageMerge.cpp @@ -34,6 +34,7 @@ #include "Analyzer/IQueryTreeNode.h" #include "Analyzer/Identifier.h" #include "Analyzer/IdentifierNode.h" +#include "Analyzer/InDepthQueryTreeVisitor.h" #include "Analyzer/Passes/QueryAnalysisPass.h" #include "Analyzer/QueryTreeBuilder.h" #include "Core/NamesAndTypes.h" @@ -564,6 +565,26 @@ void ReadFromMerge::initializePipeline(QueryPipelineBuilder & pipeline, const Bu pipeline.addResources(std::move(resources)); } +namespace +{ + +class ApplyAliasColumnExpressionsVisitor : public InDepthQueryTreeVisitor +{ +public: + ApplyAliasColumnExpressionsVisitor() = default; + + void visitImpl(QueryTreeNodePtr & node) + { + if (auto * column = node->as(); + column != nullptr && column->hasExpression()) + { + node = column->getExpressionOrThrow(); + } + } +}; + +} + SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const ContextPtr & modified_context, const StorageWithLockAndName & storage_with_lock_and_name, const StorageSnapshotPtr & storage_snapshot, @@ -611,23 +632,28 @@ SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const ContextPtr & modified_ QueryTreeNodePtr column_node; + if (is_alias) { // column_node = buildQueryTree(column_default->expression, modified_context); - column_node = std::make_shared(Identifier{column}); + QueryTreeNodePtr fake_node = std::make_shared(Identifier{column}); - LOG_DEBUG(&Poco::Logger::get("getModifiedQueryInfo"), "QT before: {}\n{}", column_node->dumpTree(), modified_query_info.table_expression->dumpTree()); + LOG_DEBUG(&Poco::Logger::get("getModifiedQueryInfo"), "QT before: {}\n{}", fake_node->dumpTree(), modified_query_info.table_expression->dumpTree()); QueryAnalysisPass query_analysis_pass(modified_query_info.table_expression); - query_analysis_pass.run(column_node, modified_context); + query_analysis_pass.run(fake_node, modified_context); + + auto * resolved_column = fake_node->as(); + + column_node = fake_node; + ApplyAliasColumnExpressionsVisitor visitor; + visitor.visit(column_node); LOG_DEBUG(&Poco::Logger::get("getModifiedQueryInfo"), "QT after: {}", column_node->dumpTree()); - auto * resolved_column = column_node->as(); if (!resolved_column || !resolved_column->getExpression()) throw Exception(ErrorCodes::LOGICAL_ERROR, "Alias column is not resolved"); - column_node = resolved_column->getExpression(); column_name_to_node.emplace(column, column_node); aliases.push_back({ .name = column, .type = resolved_column->getResultType(), .expression = column_node->toAST() }); } @@ -1095,6 +1121,8 @@ void ReadFromMerge::convertingSourceStream( std::move(convert_actions_dag), ExpressionActionsSettings::fromContext(local_context, CompileExpressions::yes)); + LOG_DEBUG(&Poco::Logger::get("convertingSourceStream"), "The header: {}", builder.getHeader().dumpStructure()); + builder.addSimpleTransform([&](const Block & stream_header) { return std::make_shared(stream_header, actions); From 
f9e67fe0427ee2d698d2b946a8286e228d47b0ec Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Mon, 19 Jun 2023 15:10:29 +0000 Subject: [PATCH 0005/1081] Update broken_tests.txt --- tests/broken_tests.txt | 2 -- 1 file changed, 2 deletions(-) diff --git a/tests/broken_tests.txt b/tests/broken_tests.txt index d49b4f391e5..1635c8740cc 100644 --- a/tests/broken_tests.txt +++ b/tests/broken_tests.txt @@ -24,7 +24,6 @@ 01173_transaction_control_queries 01211_optimize_skip_unused_shards_type_mismatch 01213_optimize_skip_unused_shards_DISTINCT -01214_test_storage_merge_aliases_with_where 01231_distributed_aggregation_memory_efficient_mix_levels 01244_optimize_distributed_group_by_sharding_key 01247_optimize_distributed_group_by_sharding_key_dist_on_dist @@ -68,7 +67,6 @@ 01890_materialized_distributed_join 01901_in_literal_shard_prune 01925_join_materialized_columns -01925_test_storage_merge_aliases 01930_optimize_skip_unused_shards_rewrite_in 01947_mv_subquery 01951_distributed_push_down_limit From dcdadd5f639def096bd330f987609d0c5740ca83 Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Mon, 19 Jun 2023 15:18:04 +0000 Subject: [PATCH 0006/1081] Update broken_tests.txt --- tests/broken_tests.txt | 1 - 1 file changed, 1 deletion(-) diff --git a/tests/broken_tests.txt b/tests/broken_tests.txt index 1635c8740cc..8b11c5f5413 100644 --- a/tests/broken_tests.txt +++ b/tests/broken_tests.txt @@ -99,7 +99,6 @@ 02494_optimize_group_by_function_keys_and_alias_columns 02521_aggregation_by_partitions 02554_fix_grouping_sets_predicate_push_down -02575_merge_prewhere_different_default_kind 02713_array_low_cardinality_string 02707_skip_index_with_in 02241_join_rocksdb_bs From 20c752fb787a05f9180f791401afe56bf372acfc Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Mon, 19 Jun 2023 15:44:01 +0000 Subject: [PATCH 0007/1081] Fix generated query --- src/Storages/StorageMerge.cpp | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/src/Storages/StorageMerge.cpp b/src/Storages/StorageMerge.cpp index 13548a84826..22308c1d901 100644 --- a/src/Storages/StorageMerge.cpp +++ b/src/Storages/StorageMerge.cpp @@ -614,7 +614,11 @@ SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const ContextPtr & modified_ std::unordered_map column_name_to_node; if (!storage_snapshot->tryGetColumn(get_column_options, "_table")) - column_name_to_node.emplace("_table", std::make_shared(current_storage_id.table_name)); + { + auto table_name_node = std::make_shared(current_storage_id.table_name); + table_name_node->setAlias("_table"); + column_name_to_node.emplace("_table", table_name_node); + } if (!storage_snapshot->tryGetColumn(get_column_options, "_database")) column_name_to_node.emplace("_database", std::make_shared(current_storage_id.database_name)); From 118b84703bb0f08aa622b956b1207d9092f5f2d7 Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Wed, 21 Jun 2023 01:51:34 +0200 Subject: [PATCH 0008/1081] WIP on StorageMerge and distributed JOIN --- src/Analyzer/ColumnNode.h | 5 ++ src/Storages/StorageMerge.cpp | 86 ++++++++++++++++++++++++++++++++--- src/Storages/StorageMerge.h | 2 +- 3 files changed, 86 insertions(+), 7 deletions(-) diff --git a/src/Analyzer/ColumnNode.h b/src/Analyzer/ColumnNode.h index b320df788c5..46e7c8eb500 100644 --- a/src/Analyzer/ColumnNode.h +++ b/src/Analyzer/ColumnNode.h @@ -108,6 +108,11 @@ public: */ QueryTreeNodePtr getColumnSourceOrNull() const; + void setColumnSource(const QueryTreeNodePtr & source) + { + getSourceWeakPointer() = source; + } + QueryTreeNodeType getNodeType() const override 
{ return QueryTreeNodeType::COLUMN; diff --git a/src/Storages/StorageMerge.cpp b/src/Storages/StorageMerge.cpp index 22308c1d901..85ec21b4765 100644 --- a/src/Storages/StorageMerge.cpp +++ b/src/Storages/StorageMerge.cpp @@ -1,5 +1,6 @@ #include #include +#include #include #include #include @@ -51,6 +52,7 @@ #include #include #include +#include #include #include @@ -583,6 +585,76 @@ public: } }; +bool hasUnknownColumn(const QueryTreeNodePtr & node, + QueryTreeNodePtr original_table_expression, + QueryTreeNodePtr replacement_table_expression) +{ + QueryTreeNodes stack = { node }; + while (!stack.empty()) + { + auto current = stack.back(); + stack.pop_back(); + + switch (current->getNodeType()) + { + case QueryTreeNodeType::CONSTANT: + break; + case QueryTreeNodeType::COLUMN: + { + auto * column_node = current->as(); + auto source = column_node->getColumnSourceOrNull(); + if (source != original_table_expression) + return true; + else + column_node->setColumnSource(replacement_table_expression); + break; + } + default: + { + for (const auto & child : node->getChildren()) + { + if (child) + stack.push_back(child); + } + } + } + } + return false; +} + +QueryTreeNodePtr removeJoin( + QueryTreeNodePtr query, + QueryTreeNodePtr original_table_expression, + QueryTreeNodePtr replacement_table_expression) +{ + auto * query_node = query->as(); + auto modified_query = query_node->cloneAndReplace(query_node->getJoinTree(), replacement_table_expression); + + query_node = modified_query->as(); + query_node->getGroupBy().getNodes().clear(); + query_node->getHaving() = {}; + query_node->getOrderBy().getNodes().clear(); + + auto & projection = query_node->getProjection().getNodes(); + auto projection_columns = query_node->getProjectionColumns(); + for (size_t i = 0; i < projection.size();) + { + if (hasUnknownColumn(projection[i], original_table_expression, replacement_table_expression)) + { + projection.erase(projection.begin() + i); + projection_columns.erase(projection_columns.begin() + i); + continue; + } + ++i; + } + + query_node->resolveProjectionColumns(std::move(projection_columns)); + + LOG_DEBUG(&Poco::Logger::get("removeJoin"), "Query without JOIN:\n{}", modified_query->dumpTree()); + + return modified_query; +} + } SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const ContextPtr & modified_context, @@ -602,8 +674,9 @@ SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const ContextPtr & modified_ if (query_info.table_expression_modifiers) replacement_table_expression->setTableExpressionModifiers(*query_info.table_expression_modifiers); - modified_query_info.query_tree = modified_query_info.query_tree->cloneAndReplace(modified_query_info.table_expression, - replacement_table_expression); + modified_query_info.query_tree = removeJoin(modified_query_info.query_tree, modified_query_info.table_expression, replacement_table_expression); + // modified_query_info.query_tree = modified_query_info.query_tree->cloneAndReplace(modified_query_info.table_expression, + // replacement_table_expression); modified_query_info.table_expression = replacement_table_expression; modified_query_info.planner_context->getOrCreateTableExpressionData(replacement_table_expression); @@ -877,7 +950,7 @@ QueryPipelineBuilderPtr ReadFromMerge::createSources( /// Subordinary tables could have different but convertible types, like numeric types of different width. /// We must return streams with structure equals to structure of Merge table. 
- convertingSourceStream(header, modified_query_info, storage_snapshot->metadata, aliases, modified_context, *builder, processed_stage); + convertingSourceStream(header, modified_query_info, storage_snapshot, aliases, modified_context, *builder, processed_stage); } return builder; @@ -1052,7 +1125,7 @@ void StorageMerge::alter( void ReadFromMerge::convertingSourceStream( const Block & header, SelectQueryInfo & modified_query_info, - const StorageMetadataPtr & metadata_snapshot, + const StorageSnapshotPtr & snapshot, const Aliases & aliases, ContextMutablePtr local_context, QueryPipelineBuilder & builder, @@ -1060,7 +1133,7 @@ void ReadFromMerge::convertingSourceStream( { Block before_block_header = builder.getHeader(); - auto storage_sample_block = metadata_snapshot->getSampleBlock(); + auto storage_sample_block = snapshot->metadata->getSampleBlock(); auto pipe_columns = builder.getHeader().getNamesAndTypesList(); if (local_context->getSettingsRef().allow_experimental_analyzer) @@ -1115,7 +1188,8 @@ void ReadFromMerge::convertingSourceStream( ActionsDAG::MatchColumnsMode convert_actions_match_columns_mode = ActionsDAG::MatchColumnsMode::Name; - if (local_context->getSettingsRef().allow_experimental_analyzer && processed_stage != QueryProcessingStage::FetchColumns) + if (local_context->getSettingsRef().allow_experimental_analyzer + && (processed_stage != QueryProcessingStage::FetchColumns || dynamic_cast(&snapshot->storage) != nullptr)) convert_actions_match_columns_mode = ActionsDAG::MatchColumnsMode::Position; auto convert_actions_dag = ActionsDAG::makeConvertingActions(builder.getHeader().getColumnsWithTypeAndName(), diff --git a/src/Storages/StorageMerge.h b/src/Storages/StorageMerge.h index 987869e5de3..de9480292f9 100644 --- a/src/Storages/StorageMerge.h +++ b/src/Storages/StorageMerge.h @@ -199,7 +199,7 @@ private: static void convertingSourceStream( const Block & header, SelectQueryInfo & modified_query_info, - const StorageMetadataPtr & metadata_snapshot, + const StorageSnapshotPtr & snapshot, const Aliases & aliases, ContextMutablePtr context, QueryPipelineBuilder & builder, From 88fe30254a280286ac2bd2b6bcdc71865ec2aed2 Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Wed, 21 Jun 2023 17:55:14 +0000 Subject: [PATCH 0009/1081] Small fixup --- src/Storages/StorageMerge.cpp | 12 +++++++++--- tests/broken_tests.txt | 1 - 2 files changed, 9 insertions(+), 4 deletions(-) diff --git a/src/Storages/StorageMerge.cpp b/src/Storages/StorageMerge.cpp index 85ec21b4765..d1ac3f57ae1 100644 --- a/src/Storages/StorageMerge.cpp +++ b/src/Storages/StorageMerge.cpp @@ -631,6 +631,10 @@ QueryTreeNodePtr removeJoin( auto modified_query = query_node->cloneAndReplace(query_node->getJoinTree(), replacement_table_expression); query_node = modified_query->as(); + + //TODO: change the predicates to make it valid and execute it on shards. 
+ query_node->getPrewhere() = {}; + query_node->getWhere() = {}; query_node->getGroupBy().getNodes().clear(); query_node->getHaving() = {}; query_node->getOrderBy().getNodes().clear(); @@ -675,8 +679,6 @@ SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const ContextPtr & modified_ replacement_table_expression->setTableExpressionModifiers(*query_info.table_expression_modifiers); modified_query_info.query_tree = removeJoin(modified_query_info.query_tree, modified_query_info.table_expression, replacement_table_expression); - // modified_query_info.query_tree = modified_query_info.query_tree->cloneAndReplace(modified_query_info.table_expression, - // replacement_table_expression); modified_query_info.table_expression = replacement_table_expression; modified_query_info.planner_context->getOrCreateTableExpressionData(replacement_table_expression); @@ -694,7 +696,11 @@ SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const ContextPtr & modified_ } if (!storage_snapshot->tryGetColumn(get_column_options, "_database")) - column_name_to_node.emplace("_database", std::make_shared(current_storage_id.database_name)); + { + auto database_name_node = std::make_shared(current_storage_id.database_name); + database_name_node->setAlias("_database"); + column_name_to_node.emplace("_database", database_name_node); + } auto storage_columns = storage_snapshot->metadata->getColumns(); diff --git a/tests/broken_tests.txt b/tests/broken_tests.txt index e6b5fb4f631..f6e21a29eed 100644 --- a/tests/broken_tests.txt +++ b/tests/broken_tests.txt @@ -38,7 +38,6 @@ 01527_dist_sharding_key_dictGet_reload 01528_allow_nondeterministic_optimize_skip_unused_shards 01540_verbatim_partition_pruning -01560_merge_distributed_join 01563_distributed_query_finish 01576_alias_column_rewrite 01583_const_column_in_set_index From 47fafdc32c320464bbd65468208bbc8e5b7ac62f Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Wed, 21 Jun 2023 18:06:24 +0000 Subject: [PATCH 0010/1081] Code cleanup --- src/Storages/StorageDistributed.cpp | 1 - src/Storages/StorageMerge.cpp | 35 ++++++++--------------------- 2 files changed, 9 insertions(+), 27 deletions(-) diff --git a/src/Storages/StorageDistributed.cpp b/src/Storages/StorageDistributed.cpp index 9f9f0fda9e2..b948ca946c3 100644 --- a/src/Storages/StorageDistributed.cpp +++ b/src/Storages/StorageDistributed.cpp @@ -30,7 +30,6 @@ #include #include #include -#include "Analyzer/IQueryTreeNode.h" #include #include diff --git a/src/Storages/StorageMerge.cpp b/src/Storages/StorageMerge.cpp index d1ac3f57ae1..1a0376edbf5 100644 --- a/src/Storages/StorageMerge.cpp +++ b/src/Storages/StorageMerge.cpp @@ -28,19 +28,17 @@ #include #include #include -#include "Common/logger_useful.h" #include #include -#include "Analyzer/ColumnNode.h" -#include "Analyzer/IQueryTreeNode.h" -#include "Analyzer/Identifier.h" -#include "Analyzer/IdentifierNode.h" -#include "Analyzer/InDepthQueryTreeVisitor.h" -#include "Analyzer/Passes/QueryAnalysisPass.h" -#include "Analyzer/QueryTreeBuilder.h" -#include "Core/NamesAndTypes.h" -#include "DataTypes/IDataType.h" -#include "Planner/PlannerActionsVisitor.h" +#include +#include +#include +#include +#include +#include +#include +#include +#include #include #include #include @@ -52,7 +50,6 @@ #include #include #include -#include #include #include @@ -654,8 +651,6 @@ QueryTreeNodePtr removeJoin( query_node->resolveProjectionColumns(std::move(projection_columns)); - LOG_DEBUG(&Poco::Logger::get("removeJoin"), "Query without JOIN:\n{}", modified_query->dumpTree()); - return 
modified_query; } @@ -718,11 +713,8 @@ SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const ContextPtr & modified_ if (is_alias) { - // column_node = buildQueryTree(column_default->expression, modified_context); QueryTreeNodePtr fake_node = std::make_shared(Identifier{column}); - LOG_DEBUG(&Poco::Logger::get("getModifiedQueryInfo"), "QT before: {}\n{}", fake_node->dumpTree(), modified_query_info.table_expression->dumpTree()); - QueryAnalysisPass query_analysis_pass(modified_query_info.table_expression); query_analysis_pass.run(fake_node, modified_context); @@ -732,8 +724,6 @@ SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const ContextPtr & modified_ ApplyAliasColumnExpressionsVisitor visitor; visitor.visit(column_node); - LOG_DEBUG(&Poco::Logger::get("getModifiedQueryInfo"), "QT after: {}", column_node->dumpTree()); - if (!resolved_column || !resolved_column->getExpression()) throw Exception(ErrorCodes::LOGICAL_ERROR, "Alias column is not resolved"); @@ -752,8 +742,6 @@ SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const ContextPtr & modified_ column_names_as_aliases = filter_actions_dag->getRequiredColumnsNames(); if (column_names_as_aliases.empty()) column_names_as_aliases.push_back(ExpressionActions::getSmallestColumn(storage_snapshot->metadata->getColumns().getAllPhysical()).name); - - LOG_DEBUG(&Poco::Logger::get("getModifiedQueryInfo"), "Required names: {}", toString(column_names_as_aliases)); } if (!column_name_to_node.empty()) @@ -764,7 +752,6 @@ SelectQueryInfo ReadFromMerge::getModifiedQueryInfo(const ContextPtr & modified_ } modified_query_info.query = queryNodeToSelectQuery(modified_query_info.query_tree); - LOG_DEBUG(&Poco::Logger::get("getModifiedQueryInfo"), "Modified query: {}", modified_query_info.query->formatForLogging()); } else { @@ -811,8 +798,6 @@ QueryPipelineBuilderPtr ReadFromMerge::createSources( modified_select.setFinal(); } - LOG_DEBUG(&Poco::Logger::get("createSources"), "real_column_names: {}", toString(real_column_names)); - bool allow_experimental_analyzer = modified_context->getSettingsRef().allow_experimental_analyzer; auto storage_stage = storage->getQueryProcessingStage(modified_context, @@ -1205,8 +1190,6 @@ void ReadFromMerge::convertingSourceStream( std::move(convert_actions_dag), ExpressionActionsSettings::fromContext(local_context, CompileExpressions::yes)); - LOG_DEBUG(&Poco::Logger::get("convertingSourceStream"), "The header: {}", builder.getHeader().dumpStructure()); - builder.addSimpleTransform([&](const Block & stream_header) { return std::make_shared(stream_header, actions); From 97a1ea01badaba10235ab0b01777f324b2f8365e Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Thu, 22 Jun 2023 15:10:53 +0000 Subject: [PATCH 0011/1081] Fix removeJoin --- src/Storages/StorageMerge.cpp | 27 ++++++++++++++++----------- 1 file changed, 16 insertions(+), 11 deletions(-) diff --git a/src/Storages/StorageMerge.cpp b/src/Storages/StorageMerge.cpp index 1a0376edbf5..fd7c0aae479 100644 --- a/src/Storages/StorageMerge.cpp +++ b/src/Storages/StorageMerge.cpp @@ -36,6 +36,7 @@ #include #include #include +#include #include #include #include @@ -625,7 +626,8 @@ QueryTreeNodePtr removeJoin( QueryTreeNodePtr replacement_table_expression) { auto * query_node = query->as(); - auto modified_query = query_node->cloneAndReplace(query_node->getJoinTree(), replacement_table_expression); + auto join_tree = query_node->getJoinTree(); + auto modified_query = query_node->cloneAndReplace(join_tree, replacement_table_expression); query_node = modified_query->as(); 
@@ -636,20 +638,23 @@ QueryTreeNodePtr removeJoin( query_node->getHaving() = {}; query_node->getOrderBy().getNodes().clear(); - auto & projection = query_node->getProjection().getNodes(); - auto projection_columns = query_node->getProjectionColumns(); - for (size_t i = 0; i < projection.size();) + if (join_tree->as() == nullptr && join_tree->as() == nullptr) { - if (hasUnknownColumn(projection[i], original_table_expression, replacement_table_expression)) + auto & projection = query_node->getProjection().getNodes(); + auto projection_columns = query_node->getProjectionColumns(); + for (size_t i = 0; i < projection.size();) { - projection.erase(projection.begin() + i); - projection_columns.erase(projection_columns.begin() + i); - continue; + if (hasUnknownColumn(projection[i], original_table_expression, replacement_table_expression)) + { + projection.erase(projection.begin() + i); + projection_columns.erase(projection_columns.begin() + i); + continue; + } + ++i; } - ++i; - } - query_node->resolveProjectionColumns(std::move(projection_columns)); + query_node->resolveProjectionColumns(std::move(projection_columns)); + } return modified_query; } From 83022b77714a204ef4025d0b5081fbc127f2a586 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Sat, 2 Sep 2023 21:56:36 +0200 Subject: [PATCH 0012/1081] Added support for parameterized view with analyzer by analyzing the select part with default values --- src/Analyzer/Passes/QueryAnalysisPass.cpp | 47 +++++++++++++++++++++ src/Analyzer/TableFunctionNode.cpp | 7 +++ src/Analyzer/TableFunctionNode.h | 3 ++ src/Interpreters/InterpreterCreateQuery.cpp | 38 +++++++++++++++-- 4 files changed, 92 insertions(+), 3 deletions(-) diff --git a/src/Analyzer/Passes/QueryAnalysisPass.cpp b/src/Analyzer/Passes/QueryAnalysisPass.cpp index 348189854e8..c82d3079118 100644 --- a/src/Analyzer/Passes/QueryAnalysisPass.cpp +++ b/src/Analyzer/Passes/QueryAnalysisPass.cpp @@ -77,6 +77,12 @@ #include #include #include +#include +#include +#include +#include +#include +#include namespace ProfileEvents { @@ -6210,8 +6216,49 @@ void QueryAnalyzer::resolveTableFunction(QueryTreeNodePtr & table_function_node, QueryExpressionsAliasVisitor & expressions_visitor, bool nested_table_function) { + + String database_name = scope.context->getCurrentDatabase(); + String table_name = table_function_node->getOriginalAST()->as()->name; + + if (table_function_node->getOriginalAST()->as()->is_compound_name) + { + std::vector parts; + splitInto<'.'>(parts, table_function_node->getOriginalAST()->as()->name); + + if (parts.size() == 2) + { + database_name = parts[0]; + table_name = parts[1]; + } + } + auto & table_function_node_typed = table_function_node->as(); + StoragePtr table = DatabaseCatalog::instance().tryGetTable({database_name, table_name}, scope.context->getQueryContext()); + if (table) + { + if (table.get()->isView() && table->as() && table->as()->isParameterizedView()) + { + auto query = table->getInMemoryMetadataPtr()->getSelectQuery().inner_query->clone(); + NameToNameMap parameterized_view_values = analyzeFunctionParamValues(table_function_node->getOriginalAST()); + StorageView::replaceQueryParametersIfParametrizedView(query, parameterized_view_values); + + ASTCreateQuery create; + create.select = query->as(); + auto sample_block = InterpreterSelectWithUnionQuery::getSampleBlock(query, scope.context); + auto res = std::make_shared(StorageID(database_name, table_name), + create, + ColumnsDescription(sample_block.getNamesAndTypesList()), + /* comment */ "", + /* 
is_parameterized_view */ true); + res->startup(); + table_function_node->getOriginalAST()->as()->prefer_subquery_to_function_formatting = true; + table_function_node_typed.resolve(std::move(res), scope.context); + return; + } + } + + if (!nested_table_function) expressions_visitor.visit(table_function_node_typed.getArgumentsNode()); diff --git a/src/Analyzer/TableFunctionNode.cpp b/src/Analyzer/TableFunctionNode.cpp index e5158a06373..f4ffe7f4ee5 100644 --- a/src/Analyzer/TableFunctionNode.cpp +++ b/src/Analyzer/TableFunctionNode.cpp @@ -36,6 +36,13 @@ void TableFunctionNode::resolve(TableFunctionPtr table_function_value, StoragePt unresolved_arguments_indexes = std::move(unresolved_arguments_indexes_); } +void TableFunctionNode::resolve(StoragePtr storage_value, ContextPtr context) +{ + storage = std::move(storage_value); + storage_id = storage->getStorageID(); + storage_snapshot = storage->getStorageSnapshot(storage->getInMemoryMetadataPtr(), context); +} + const StorageID & TableFunctionNode::getStorageID() const { if (!storage) diff --git a/src/Analyzer/TableFunctionNode.h b/src/Analyzer/TableFunctionNode.h index 69237ac8416..ed1a26c4dd4 100644 --- a/src/Analyzer/TableFunctionNode.h +++ b/src/Analyzer/TableFunctionNode.h @@ -100,6 +100,9 @@ public: /// Resolve table function with table function, storage and context void resolve(TableFunctionPtr table_function_value, StoragePtr storage_value, ContextPtr context, std::vector unresolved_arguments_indexes_); + /// Resolve table function as parameterized view with storage and context + void resolve(StoragePtr storage_value, ContextPtr context); + /// Get storage id, throws exception if function node is not resolved const StorageID & getStorageID() const; diff --git a/src/Interpreters/InterpreterCreateQuery.cpp b/src/Interpreters/InterpreterCreateQuery.cpp index 92d74f4f18a..58b6722aae9 100644 --- a/src/Interpreters/InterpreterCreateQuery.cpp +++ b/src/Interpreters/InterpreterCreateQuery.cpp @@ -76,7 +76,8 @@ #include #include - +#include +#include namespace DB { @@ -745,12 +746,43 @@ InterpreterCreateQuery::TableProperties InterpreterCreateQuery::getTableProperti } else if (create.select) { - Block as_select_sample; if (getContext()->getSettingsRef().allow_experimental_analyzer) { - as_select_sample = InterpreterSelectQueryAnalyzer::getSampleBlock(create.select->clone(), getContext()); + if (create.isParameterizedView()) + { + auto select = create.select->clone(); + + ///Get all query parameters + const auto parameters = analyzeReceiveQueryParamsWithType(select); + NameToNameMap parameter_values; + + for (const auto & parameter : parameters) + { + const auto data_type = DataTypeFactory::instance().get(parameter.second); + /// Todo improve getting default values & include more datatypes + if (data_type->isValueRepresentedByNumber() || parameter.second == "String") + parameter_values[parameter.first] = "1"; + else if (parameter.second.starts_with("Array") || parameter.second.starts_with("Map")) + parameter_values[parameter.first] = "[]"; + else + parameter_values[parameter.first] = " "; + LOG_INFO(&Poco::Logger::get("InterpreterCreateQuery"), "parameter = {} = {} ", parameter.first, parameter_values[parameter.first]); + + } + + /// Replace with default parameters + ReplaceQueryParameterVisitor visitor(parameter_values); + visitor.visit(select); + + as_select_sample = InterpreterSelectQueryAnalyzer::getSampleBlock(select, getContext()); + } + else + { + as_select_sample = InterpreterSelectQueryAnalyzer::getSampleBlock(create.select->clone(), 
getContext()); + } + } else { From 2dfda84da0e16c594df7df4eb2b05ee1baba1193 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Sat, 2 Sep 2023 21:57:57 +0200 Subject: [PATCH 0013/1081] Removed parameterized view tests from analyzer_tech_debt.txt --- tests/analyzer_tech_debt.txt | 2 -- 1 file changed, 2 deletions(-) diff --git a/tests/analyzer_tech_debt.txt b/tests/analyzer_tech_debt.txt index 15d46403da9..5521234495f 100644 --- a/tests/analyzer_tech_debt.txt +++ b/tests/analyzer_tech_debt.txt @@ -88,7 +88,6 @@ 02402_merge_engine_with_view 02404_memory_bound_merging 02426_orc_bug -02428_parameterized_view 02458_use_structure_from_insertion_table 02479_race_condition_between_insert_and_droppin_mv 02493_inconsistent_hex_and_binary_number @@ -123,7 +122,6 @@ 02581_share_big_sets_between_mutation_tasks_long 02581_share_big_sets_between_multiple_mutations_tasks_long 00992_system_parts_race_condition_zookeeper_long -02818_parameterized_view_with_cte_multiple_usage 02790_optimize_skip_unused_shards_join 01940_custom_tld_sharding_key 02815_range_dict_no_direct_join From 59195e1199d5c8ed31f4243b58f3186771219295 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Mon, 4 Sep 2023 19:03:23 +0200 Subject: [PATCH 0014/1081] Removed log for each parameter --- src/Interpreters/InterpreterCreateQuery.cpp | 2 -- 1 file changed, 2 deletions(-) diff --git a/src/Interpreters/InterpreterCreateQuery.cpp b/src/Interpreters/InterpreterCreateQuery.cpp index 58b6722aae9..66c219dcd56 100644 --- a/src/Interpreters/InterpreterCreateQuery.cpp +++ b/src/Interpreters/InterpreterCreateQuery.cpp @@ -768,8 +768,6 @@ InterpreterCreateQuery::TableProperties InterpreterCreateQuery::getTableProperti parameter_values[parameter.first] = "[]"; else parameter_values[parameter.first] = " "; - LOG_INFO(&Poco::Logger::get("InterpreterCreateQuery"), "parameter = {} = {} ", parameter.first, parameter_values[parameter.first]); - } /// Replace with default parameters From eb7aad00160b1418ed96ecc83770b62ce3bfaaf0 Mon Sep 17 00:00:00 2001 From: kssenii Date: Tue, 14 Nov 2023 11:35:54 +0100 Subject: [PATCH 0015/1081] Do not consider parts broken if only projections are broken --- src/Interpreters/MutationsInterpreter.cpp | 14 + src/Interpreters/MutationsInterpreter.h | 1 + src/Storages/MergeTree/IMergeTreeDataPart.cpp | 61 +++- src/Storages/MergeTree/IMergeTreeDataPart.h | 19 +- src/Storages/MergeTree/MergeTreeData.cpp | 26 +- src/Storages/MergeTree/MergeTreeData.h | 11 +- .../MergeTree/MergeTreeDataPartChecksum.h | 2 + src/Storages/MergeTree/MutateTask.cpp | 8 +- .../ReplicatedMergeTreePartCheckThread.cpp | 31 +- .../ReplicatedMergeTreePartCheckThread.h | 4 +- src/Storages/MergeTree/checkDataPart.cpp | 80 ++++- src/Storages/MergeTree/checkDataPart.h | 4 +- src/Storages/StorageMergeTree.cpp | 5 +- src/Storages/StorageReplicatedMergeTree.cpp | 3 +- src/Storages/System/StorageSystemDisks.cpp | 2 +- .../System/StorageSystemPartsBase.cpp | 8 +- src/Storages/System/StorageSystemPartsBase.h | 2 +- .../System/StorageSystemProjectionParts.cpp | 48 ++- .../StorageSystemProjectionPartsColumns.cpp | 21 +- .../02916_broken_projection.reference | 224 ++++++++++++++ .../0_stateless/02916_broken_projection.sh | 283 ++++++++++++++++++ 21 files changed, 795 insertions(+), 62 deletions(-) create mode 100644 tests/queries/0_stateless/02916_broken_projection.reference create mode 100755 tests/queries/0_stateless/02916_broken_projection.sh diff --git a/src/Interpreters/MutationsInterpreter.cpp b/src/Interpreters/MutationsInterpreter.cpp index 
0ace0a8b79c..a9a5d4f33d0 100644 --- a/src/Interpreters/MutationsInterpreter.cpp +++ b/src/Interpreters/MutationsInterpreter.cpp @@ -305,6 +305,11 @@ bool MutationsInterpreter::Source::hasProjection(const String & name) const return part && part->hasProjection(name); } +bool MutationsInterpreter::Source::hasBrokenProjection(const String & name) const +{ + return part && part->hasBrokenProjection(name); +} + bool MutationsInterpreter::Source::isCompactPart() const { return part && part->getType() == MergeTreeDataPartType::Compact; @@ -922,6 +927,15 @@ void MutationsInterpreter::prepare(bool dry_run) materialized_indices.insert(index.name); } + /// Always rebuild broken projections. + for (const auto & projection : metadata_snapshot->getProjections()) + { + if (!source.hasBrokenProjection(projection.name)) + continue; + + materialized_projections.insert(projection.name); + } + for (const auto & projection : metadata_snapshot->getProjections()) { if (!source.hasProjection(projection.name)) diff --git a/src/Interpreters/MutationsInterpreter.h b/src/Interpreters/MutationsInterpreter.h index c53b86ddb5e..33b8021a653 100644 --- a/src/Interpreters/MutationsInterpreter.h +++ b/src/Interpreters/MutationsInterpreter.h @@ -122,6 +122,7 @@ public: bool materializeTTLRecalculateOnly() const; bool hasSecondaryIndex(const String & name) const; bool hasProjection(const String & name) const; + bool hasBrokenProjection(const String & name) const; bool isCompactPart() const; void read( diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index 9bc72577b25..bc81758675e 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -732,7 +732,23 @@ void IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool ch else { auto part = getProjectionPartBuilder(projection.name).withPartFormatFromDisk().build(); - part->loadColumnsChecksumsIndexes(require_columns_checksums, check_consistency); + + try + { + part->loadColumnsChecksumsIndexes(require_columns_checksums, check_consistency); + } + catch (...) + { + if (isRetryableException(std::current_exception())) + throw; + + LOG_ERROR(&Poco::Logger::get("IMergeTreeDataPart"), + "Cannot load projection {}, will consider it broken", projection.name); + + addBrokenProjectionPart(projection.name, std::move(part), getCurrentExceptionMessage(false), getCurrentExceptionCode()); + continue; + } + addProjectionPart(projection.name, std::move(part)); } } @@ -1129,7 +1145,8 @@ void IMergeTreeDataPart::loadChecksums(bool require) /// Check the data while we are at it. LOG_WARNING(storage.log, "Checksums for part {} not found. 
Will calculate them from data on disk.", name); - checksums = checkDataPart(shared_from_this(), false); + bool noop; + checksums = checkDataPart(shared_from_this(), false, noop, /* is_cancelled */{}, /* throw_on_broken_projection */false); writeChecksums(checksums, {}); bytes_on_disk = checksums.getTotalSizeOnDisk(); @@ -2130,6 +2147,46 @@ std::optional IMergeTreeDataPart::getStreamNameForColumn( return getStreamNameOrHash(stream_name, extension, storage_); } +void IMergeTreeDataPart::addBrokenProjectionPart( + const String & projection_name, + std::shared_ptr projection_part, + const String & message, + int code) +{ + projection_part->setBrokenReason(message, code); + bool inserted = broken_projection_parts.emplace(projection_name, projection_part).second; + if (!inserted) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Projection part {} in part {} is already added to a broken projection parts list", projection_name, name); +} + +void IMergeTreeDataPart::markProjectionPartAsBroken(const String & projection_name, const String & message, int code) const +{ + std::lock_guard lock(broken_projections_mutex); + + auto it = projection_parts.find(projection_name); + if (it == projection_parts.end()) + throw Exception(ErrorCodes::LOGICAL_ERROR, "There is no projection part '{}'", projection_name); + + it->second->setBrokenReason(message, code); + + broken_projection_parts.emplace(projection_name, it->second); + projection_parts.erase(it); +} + +void IMergeTreeDataPart::setBrokenReason(const String & message, int code) +{ + std::lock_guard lock(broken_projections_mutex); + is_broken = true; + exception = message; + exception_code = code; +} + +bool IMergeTreeDataPart::hasBrokenProjection(const String & projection_name) const +{ + std::lock_guard lock(broken_projections_mutex); + return broken_projection_parts.contains(projection_name); +} + bool isCompactPart(const MergeTreeDataPartPtr & data_part) { return (data_part && data_part->getType() == MergeTreeDataPartType::Compact); diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.h b/src/Storages/MergeTree/IMergeTreeDataPart.h index a9659d2f5f4..52a1541e15f 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.h +++ b/src/Storages/MergeTree/IMergeTreeDataPart.h @@ -255,6 +255,12 @@ public: /// Frozen by ALTER TABLE ... FREEZE ... It is used for information purposes in system.parts table. mutable std::atomic is_frozen {false}; + /// If it is a projection part, it can be broken sometimes. 
+ mutable std::atomic is_broken {false}; + mutable std::string exception; + mutable int exception_code = 0; + mutable std::mutex broken_projections_mutex; + /// Indicates that the part was marked Outdated by PartCheckThread because the part was not committed to ZooKeeper mutable bool is_unexpected_local_part = false; @@ -405,12 +411,20 @@ public: const std::map> & getProjectionParts() const { return projection_parts; } + const std::map> & getBrokenProjectionParts() const { return broken_projection_parts; } + MergeTreeDataPartBuilder getProjectionPartBuilder(const String & projection_name, bool is_temp_projection = false); void addProjectionPart(const String & projection_name, std::shared_ptr && projection_part); + void addBrokenProjectionPart(const String & projection_name, std::shared_ptr projection_part, const String & message, int code); + + void markProjectionPartAsBroken(const String & projection_name, const String & message, int code) const; + bool hasProjection(const String & projection_name) const { return projection_parts.contains(projection_name); } + bool hasBrokenProjection(const String & projection_name) const; + void loadProjections(bool require_columns_checksums, bool check_consistency, bool if_not_loaded = false); /// Return set of metadata file names without checksums. For example, @@ -564,7 +578,8 @@ protected: const IMergeTreeDataPart * parent_part; String parent_part_name; - std::map> projection_parts; + mutable std::map> projection_parts; + mutable std::map> broken_projection_parts; mutable PartMetadataManagerPtr metadata_manager; @@ -678,6 +693,8 @@ private: void incrementStateMetric(MergeTreeDataPartState state) const; void decrementStateMetric(MergeTreeDataPartState state) const; + void setBrokenReason(const String & message, int code); + /// This ugly flag is needed for debug assertions only mutable bool part_is_probably_removed_from_disk = false; }; diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index 1c0f9208fef..152c386e188 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -5737,7 +5737,7 @@ MergeTreeData::getDataPartsVectorForInternalUsage(const DataPartStates & afforda } MergeTreeData::ProjectionPartsVector -MergeTreeData::getProjectionPartsVectorForInternalUsage(const DataPartStates & affordable_states, DataPartStateVector * out_states) const +MergeTreeData::getProjectionPartsVectorForInternalUsage(const DataPartStates & affordable_states, bool fill_states) const { auto lock = lockParts(); ProjectionPartsVector res; @@ -5749,14 +5749,20 @@ MergeTreeData::getProjectionPartsVectorForInternalUsage(const DataPartStates & a res.data_parts.push_back(part); for (const auto & [_, projection_part] : part->getProjectionParts()) res.projection_parts.push_back(projection_part); + for (const auto & [_, projection_part] : part->getBrokenProjectionParts()) + res.broken_projection_parts.push_back(projection_part); } } - if (out_states != nullptr) + if (fill_states) { - out_states->resize(res.projection_parts.size()); + res.projection_parts_states.resize(res.projection_parts.size()); for (size_t i = 0; i < res.projection_parts.size(); ++i) - (*out_states)[i] = res.projection_parts[i]->getParentPart()->getState(); + (res.projection_parts_states)[i] = res.projection_parts[i]->getParentPart()->getState(); + + res.broken_projection_parts_states.resize(res.broken_projection_parts.size()); + for (size_t i = 0; i < res.broken_projection_parts.size(); ++i) + 
(res.broken_projection_parts_states)[i] = res.broken_projection_parts[i]->getParentPart()->getState(); } return res; @@ -5809,7 +5815,7 @@ bool MergeTreeData::supportsLightweightDelete() const return true; } -MergeTreeData::ProjectionPartsVector MergeTreeData::getAllProjectionPartsVector(MergeTreeData::DataPartStateVector * out_states) const +MergeTreeData::ProjectionPartsVector MergeTreeData::getAllProjectionPartsVector(bool fill_states) const { ProjectionPartsVector res; auto lock = lockParts(); @@ -5820,11 +5826,15 @@ MergeTreeData::ProjectionPartsVector MergeTreeData::getAllProjectionPartsVector( res.projection_parts.push_back(projection_part); } - if (out_states != nullptr) + if (fill_states) { - out_states->resize(res.projection_parts.size()); + res.projection_parts_states.resize(res.projection_parts.size()); for (size_t i = 0; i < res.projection_parts.size(); ++i) - (*out_states)[i] = res.projection_parts[i]->getParentPart()->getState(); + (res.projection_parts_states)[i] = res.projection_parts[i]->getParentPart()->getState(); + + res.broken_projection_parts_states.resize(res.broken_projection_parts.size()); + for (size_t i = 0; i < res.broken_projection_parts.size(); ++i) + (res.broken_projection_parts_states)[i] = res.broken_projection_parts[i]->getParentPart()->getState(); } return res; } diff --git a/src/Storages/MergeTree/MergeTreeData.h b/src/Storages/MergeTree/MergeTreeData.h index 54104849fe4..4ef3b75988b 100644 --- a/src/Storages/MergeTree/MergeTreeData.h +++ b/src/Storages/MergeTree/MergeTreeData.h @@ -468,8 +468,13 @@ public: struct ProjectionPartsVector { - DataPartsVector projection_parts; DataPartsVector data_parts; + + DataPartsVector projection_parts; + DataPartStateVector projection_parts_states; + + DataPartsVector broken_projection_parts; + DataPartStateVector broken_projection_parts_states; }; /// Returns a copy of the list so that the caller shouldn't worry about locks. @@ -484,7 +489,7 @@ public: const DataPartStates & affordable_states, DataPartStateVector * out_states = nullptr) const; /// Same as above but only returns projection parts ProjectionPartsVector getProjectionPartsVectorForInternalUsage( - const DataPartStates & affordable_states, DataPartStateVector * out_states = nullptr) const; + const DataPartStates & affordable_states, bool fill_states = false) const; /// Returns absolutely all parts (and snapshot of their states) @@ -496,7 +501,7 @@ public: size_t getTotalMarksCount() const; /// Same as above but only returns projection parts - ProjectionPartsVector getAllProjectionPartsVector(MergeTreeData::DataPartStateVector * out_states = nullptr) const; + ProjectionPartsVector getAllProjectionPartsVector(bool fill_states = false) const; /// Returns parts in Active state DataParts getDataPartsForInternalUsage() const; diff --git a/src/Storages/MergeTree/MergeTreeDataPartChecksum.h b/src/Storages/MergeTree/MergeTreeDataPartChecksum.h index 8e5e8c8c448..3595ce38db5 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartChecksum.h +++ b/src/Storages/MergeTree/MergeTreeDataPartChecksum.h @@ -54,6 +54,8 @@ struct MergeTreeDataPartChecksums bool has(const String & file_name) const { return files.find(file_name) != files.end(); } + bool remove(const String & file_name) { return files.erase(file_name); } + bool empty() const { return files.empty(); } /// Checks that the set of columns and their checksums are the same. If not, throws an exception. 
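Note on the checksum change above: the new MergeTreeDataPartChecksums::remove() exists so that a broken projection's "<name>.proj" entry can be dropped from the parent part's checksums instead of the whole part being declared broken. The following is a minimal, self-contained sketch of that control flow only; PartChecksums, ProjectionPart, checkProjections and the validate callback are simplified stand-ins invented for this illustration, not ClickHouse's real classes or API.

#include <exception>
#include <functional>
#include <iostream>
#include <map>
#include <stdexcept>
#include <string>
#include <vector>

// Simplified stand-in for MergeTreeDataPartChecksums: file name -> checksum.
struct PartChecksums
{
    std::map<std::string, std::string> files;
    bool remove(const std::string & file_name) { return files.erase(file_name) != 0; }
};

// Simplified stand-in for a projection part stored inside a data part.
struct ProjectionPart
{
    std::string name;
    bool is_broken = false;
    std::string exception;
};

// Check every projection of a part. A failing projection is marked broken and its
// ".proj" entry is removed from the parent checksums; the part itself survives.
void checkProjections(std::vector<ProjectionPart> & projections,
                      PartChecksums & parent_checksums,
                      const std::function<void(const ProjectionPart &)> & validate)
{
    for (auto & projection : projections)
    {
        const std::string projection_file = projection.name + ".proj";
        try
        {
            validate(projection);
        }
        catch (const std::exception & e)
        {
            projection.is_broken = true;             // remember why it is broken
            projection.exception = e.what();
            parent_checksums.remove(projection_file); // keep the part, drop the projection entry
            std::cerr << "Projection " << projection.name << " is broken: " << e.what() << '\n';
        }
    }
}

int main()
{
    PartChecksums checksums;
    checksums.files = {{"data.bin", "abc"}, {"proj_a.proj", "def"}};

    std::vector<ProjectionPart> projections = {{"proj_a"}, {"proj_b"}};

    // Hypothetical validation callback: pretend proj_a fails its checksum check.
    checkProjections(projections, checksums, [](const ProjectionPart & p)
    {
        if (p.name == "proj_a")
            throw std::runtime_error("checksum mismatch in " + p.name + ".proj");
    });

    std::cout << "remaining checksum entries: " << checksums.files.size() << '\n'; // only data.bin remains
    return 0;
}

In the actual patch this pattern is carried by loadProjections() and checkDataPart() against the real IMergeTreeDataPart API, and the MutateTask/MutationsInterpreter changes later in this commit rebuild any projection that was marked broken during a subsequent mutation.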
diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index 911b25de2ad..8ef1621b647 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -513,7 +513,9 @@ static std::set getProjectionsToRecalculate( { bool need_recalculate = materialized_projections.contains(projection.name) - || (!is_full_part_storage && source_part->hasProjection(projection.name)); + || (!is_full_part_storage + && (source_part->hasProjection(projection.name) + || source_part->hasBrokenProjection(projection.name))); if (need_recalculate) projections_to_recalc.insert(&projection); @@ -1367,7 +1369,9 @@ private: bool need_recalculate = ctx->materialized_projections.contains(projection.name) - || (!is_full_part_storage && ctx->source_part->hasProjection(projection.name)); + || (!is_full_part_storage + && (ctx->source_part->hasProjection(projection.name) + || ctx->source_part->hasBrokenProjection(projection.name))); if (need_recalculate) { diff --git a/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp b/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp index b1875464725..4468cf8e3bf 100644 --- a/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp +++ b/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp @@ -274,7 +274,7 @@ std::pair ReplicatedMergeTreePartCheckThread::findLo return std::make_pair(exists_in_zookeeper, part); } -ReplicatedCheckResult ReplicatedMergeTreePartCheckThread::checkPartImpl(const String & part_name) +ReplicatedCheckResult ReplicatedMergeTreePartCheckThread::checkPartImpl(const String & part_name, bool throw_on_broken_projection) { ReplicatedCheckResult result; auto [exists_in_zookeeper, part] = findLocalPart(part_name); @@ -341,6 +341,7 @@ ReplicatedCheckResult ReplicatedMergeTreePartCheckThread::checkPartImpl(const St /// before the ReplicatedMergeTreePartHeader was introduced. String part_path = storage.replica_path + "/parts/" + part_name; String part_znode = zookeeper->get(part_path); + bool is_broken_projection = false; try { @@ -362,8 +363,10 @@ ReplicatedCheckResult ReplicatedMergeTreePartCheckThread::checkPartImpl(const St checkDataPart( part, - true, - [this] { return need_stop.load(); }); + /* require_checksums */true, + is_broken_projection, + [this] { return need_stop.load(); }, + throw_on_broken_projection); if (need_stop) { @@ -384,12 +387,22 @@ ReplicatedCheckResult ReplicatedMergeTreePartCheckThread::checkPartImpl(const St tryLogCurrentException(log, __PRETTY_FUNCTION__); - auto message = PreformattedMessage::create("Part {} looks broken. Removing it and will try to fetch.", part_name); - LOG_ERROR(log, message); + PreformattedMessage message; + if (is_broken_projection) + { + message = PreformattedMessage::create("Part {} has a broken projection. It will be ignored.", part_name); + LOG_DEBUG(log, message); + result.action = ReplicatedCheckResult::DoNothing; + } + else + { + message = PreformattedMessage::create("Part {} looks broken. Removing it and will try to fetch.", part_name); + LOG_ERROR(log, message); + result.action = ReplicatedCheckResult::TryFetchMissing; + } /// Part is broken, let's try to find it and fetch. 
result.status = {part_name, false, message}; - result.action = ReplicatedCheckResult::TryFetchMissing; return result; } @@ -419,12 +432,12 @@ ReplicatedCheckResult ReplicatedMergeTreePartCheckThread::checkPartImpl(const St } -CheckResult ReplicatedMergeTreePartCheckThread::checkPartAndFix(const String & part_name, std::optional * recheck_after) +CheckResult ReplicatedMergeTreePartCheckThread::checkPartAndFix(const String & part_name, std::optional * recheck_after, bool throw_on_broken_projection) { LOG_INFO(log, "Checking part {}", part_name); ProfileEvents::increment(ProfileEvents::ReplicatedPartChecks); - ReplicatedCheckResult result = checkPartImpl(part_name); + ReplicatedCheckResult result = checkPartImpl(part_name, throw_on_broken_projection); switch (result.action) { case ReplicatedCheckResult::None: UNREACHABLE(); @@ -577,7 +590,7 @@ void ReplicatedMergeTreePartCheckThread::run() } std::optional recheck_after; - checkPartAndFix(selected->name, &recheck_after); + checkPartAndFix(selected->name, &recheck_after, /* throw_on_broken_projection */false); if (need_stop) return; diff --git a/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.h b/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.h index 68dc6ca3d1d..26c4bfe9384 100644 --- a/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.h +++ b/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.h @@ -65,9 +65,9 @@ public: size_t size() const; /// Check part by name - CheckResult checkPartAndFix(const String & part_name, std::optional * recheck_after = nullptr); + CheckResult checkPartAndFix(const String & part_name, std::optional * recheck_after = nullptr, bool throw_on_broken_projection = true); - ReplicatedCheckResult checkPartImpl(const String & part_name); + ReplicatedCheckResult checkPartImpl(const String & part_name, bool throw_on_broken_projection); std::unique_lock pausePartsCheck(); diff --git a/src/Storages/MergeTree/checkDataPart.cpp b/src/Storages/MergeTree/checkDataPart.cpp index a75df00e8a7..74af7cbb77c 100644 --- a/src/Storages/MergeTree/checkDataPart.cpp +++ b/src/Storages/MergeTree/checkDataPart.cpp @@ -111,7 +111,9 @@ static IMergeTreeDataPart::Checksums checkDataPart( const NameSet & files_without_checksums, const ReadSettings & read_settings, bool require_checksums, - std::function is_cancelled) + std::function is_cancelled, + bool & is_broken_projection, + bool throw_on_broken_projection) { /** Responsibility: * - read list of columns from columns.txt; @@ -120,6 +122,7 @@ static IMergeTreeDataPart::Checksums checkDataPart( */ CurrentMetrics::Increment metric_increment{CurrentMetrics::ReplicatedChecks}; + Poco::Logger * log = &Poco::Logger::get("checkDataPart"); NamesAndTypesList columns_txt; @@ -269,23 +272,68 @@ static IMergeTreeDataPart::Checksums checkDataPart( } } - for (const auto & [name, projection] : data_part->getProjectionParts()) + auto check_projection = [&](const String & name, std::shared_ptr projection) { - if (is_cancelled()) - return {}; - auto projection_file = name + ".proj"; - auto projection_checksums = checkDataPart( - projection, *data_part_storage.getProjection(projection_file), - projection->getColumns(), projection->getType(), - projection->getFileNamesWithoutChecksums(), - read_settings, require_checksums, is_cancelled); + if (!throw_on_broken_projection && projection->is_broken) + { + projections_on_disk.erase(projection_file); + checksums_txt.remove(projection_file); + return; + } + + IMergeTreeDataPart::Checksums projection_checksums; + try + { + bool noop; + 
projection_checksums = checkDataPart( + projection, *data_part_storage.getProjection(projection_file), + projection->getColumns(), projection->getType(), + projection->getFileNamesWithoutChecksums(), + read_settings, require_checksums, is_cancelled, noop, /* throw_on_broken_projection */false); + } + catch (...) + { + if (isRetryableException(std::current_exception())) + throw; + + LOG_TEST(log, "Marking projection {} as broken ({})", name, projection_file); + + if (!data_part->hasBrokenProjection(name)) + data_part->markProjectionPartAsBroken(name, getCurrentExceptionMessage(false), getCurrentExceptionCode()); + + is_broken_projection = true; + if (throw_on_broken_projection) + throw; + + projections_on_disk.erase(projection_file); + checksums_txt.remove(projection_file); + return; + } checksums_data.files[projection_file] = IMergeTreeDataPart::Checksums::Checksum( projection_checksums.getTotalSizeOnDisk(), projection_checksums.getTotalChecksumUInt128()); projections_on_disk.erase(projection_file); + }; + + auto broken_projection_parts = data_part->getBrokenProjectionParts(); /// Iterate over copy + for (const auto & [name, projection] : broken_projection_parts) + { + if (is_cancelled()) + return {}; + else + check_projection(name, projection); + } + + auto projection_parts = data_part->getProjectionParts(); /// Iterate over copy + for (const auto & [name, projection] : projection_parts) + { + if (is_cancelled()) + return {}; + else + check_projection(name, projection); } if (require_checksums && !projections_on_disk.empty()) @@ -315,7 +363,9 @@ IMergeTreeDataPart::Checksums checkDataPartInMemory(const DataPartInMemoryPtr & IMergeTreeDataPart::Checksums checkDataPart( MergeTreeData::DataPartPtr data_part, bool require_checksums, - std::function is_cancelled) + bool & is_broken_projection, + std::function is_cancelled, + bool throw_on_broken_projection) { if (auto part_in_memory = asInMemoryPart(data_part)) return checkDataPartInMemory(part_in_memory); @@ -357,7 +407,9 @@ IMergeTreeDataPart::Checksums checkDataPart( data_part->getFileNamesWithoutChecksums(), read_settings, require_checksums, - is_cancelled); + is_cancelled, + is_broken_projection, + throw_on_broken_projection); }; try @@ -371,7 +423,9 @@ IMergeTreeDataPart::Checksums checkDataPart( data_part->getFileNamesWithoutChecksums(), read_settings, require_checksums, - is_cancelled); + is_cancelled, + is_broken_projection, + throw_on_broken_projection); } catch (...) { diff --git a/src/Storages/MergeTree/checkDataPart.h b/src/Storages/MergeTree/checkDataPart.h index d0e48b6f80a..a01978f4efe 100644 --- a/src/Storages/MergeTree/checkDataPart.h +++ b/src/Storages/MergeTree/checkDataPart.h @@ -10,7 +10,9 @@ namespace DB IMergeTreeDataPart::Checksums checkDataPart( MergeTreeData::DataPartPtr data_part, bool require_checksums, - std::function is_cancelled = []{ return false; }); + bool & is_broken_projection, + std::function is_cancelled = []{ return false; }, + bool throw_on_broken_projection = false); bool isNotEnoughMemoryErrorCode(int code); bool isRetryableException(const std::exception_ptr exception_ptr); diff --git a/src/Storages/StorageMergeTree.cpp b/src/Storages/StorageMergeTree.cpp index e9a0dd5fbf3..74277616e95 100644 --- a/src/Storages/StorageMergeTree.cpp +++ b/src/Storages/StorageMergeTree.cpp @@ -2242,11 +2242,12 @@ std::optional StorageMergeTree::checkDataNext(DataValidationTasksPt { /// If the checksums file is not present, calculate the checksums and write them to disk. 
static constexpr auto checksums_path = "checksums.txt"; + bool noop; if (part->isStoredOnDisk() && !part->getDataPartStorage().exists(checksums_path)) { try { - auto calculated_checksums = checkDataPart(part, false); + auto calculated_checksums = checkDataPart(part, false, noop, /* is_cancelled */{}, /* throw_on_broken_projection */true); calculated_checksums.checkEqual(part->checksums, true); auto & part_mutable = const_cast(*part); @@ -2267,7 +2268,7 @@ std::optional StorageMergeTree::checkDataNext(DataValidationTasksPt { try { - checkDataPart(part, true); + checkDataPart(part, true, noop, /* is_cancelled */{}, /* throw_on_broken_projection */true); return CheckResult(part->name, true, ""); } catch (...) diff --git a/src/Storages/StorageReplicatedMergeTree.cpp b/src/Storages/StorageReplicatedMergeTree.cpp index 74821a9186c..1859fa03094 100644 --- a/src/Storages/StorageReplicatedMergeTree.cpp +++ b/src/Storages/StorageReplicatedMergeTree.cpp @@ -8690,12 +8690,11 @@ IStorage::DataValidationTasksPtr StorageReplicatedMergeTree::getCheckTaskList( std::optional StorageReplicatedMergeTree::checkDataNext(DataValidationTasksPtr & check_task_list) { - if (auto part = assert_cast(check_task_list.get())->next()) { try { - return CheckResult(part_check_thread.checkPartAndFix(part->name)); + return part_check_thread.checkPartAndFix(part->name, /* recheck_after */nullptr, /* throw_on_broken_projection */true); } catch (const Exception & ex) { diff --git a/src/Storages/System/StorageSystemDisks.cpp b/src/Storages/System/StorageSystemDisks.cpp index 23a00cc7ae5..250fcdba641 100644 --- a/src/Storages/System/StorageSystemDisks.cpp +++ b/src/Storages/System/StorageSystemDisks.cpp @@ -63,7 +63,7 @@ Pipe StorageSystemDisks::read( for (const auto & [disk_name, disk_ptr] : context->getDisksMap()) { col_name->insert(disk_name); - col_path->insert(disk_ptr->getPath()); + col_path->insert(fs::absolute(disk_ptr->getPath()).string()); col_free->insert(disk_ptr->getAvailableSpace().value_or(std::numeric_limits::max())); col_total->insert(disk_ptr->getTotalSpace().value_or(std::numeric_limits::max())); col_unreserved->insert(disk_ptr->getUnreservedSpace().value_or(std::numeric_limits::max())); diff --git a/src/Storages/System/StorageSystemPartsBase.cpp b/src/Storages/System/StorageSystemPartsBase.cpp index 513af6cfc46..e97c13b1fed 100644 --- a/src/Storages/System/StorageSystemPartsBase.cpp +++ b/src/Storages/System/StorageSystemPartsBase.cpp @@ -64,7 +64,7 @@ StoragesInfo::getParts(MergeTreeData::DataPartStateVector & state, bool has_stat } MergeTreeData::ProjectionPartsVector -StoragesInfo::getProjectionParts(MergeTreeData::DataPartStateVector & state, bool has_state_column) const +StoragesInfo::getProjectionParts(bool fill_states, bool has_state_column) const { if (data->getInMemoryMetadataPtr()->projections.empty()) return {}; @@ -74,12 +74,12 @@ StoragesInfo::getProjectionParts(MergeTreeData::DataPartStateVector & state, boo { /// If has_state_column is requested, return all states. 
if (!has_state_column) - return data->getProjectionPartsVectorForInternalUsage({State::Active, State::Outdated}, &state); + return data->getProjectionPartsVectorForInternalUsage({State::Active, State::Outdated}, fill_states); - return data->getAllProjectionPartsVector(&state); + return data->getAllProjectionPartsVector(fill_states); } - return data->getProjectionPartsVectorForInternalUsage({State::Active}, &state); + return data->getProjectionPartsVectorForInternalUsage({State::Active}, fill_states); } StoragesInfoStream::StoragesInfoStream(const SelectQueryInfo & query_info, ContextPtr context) diff --git a/src/Storages/System/StorageSystemPartsBase.h b/src/Storages/System/StorageSystemPartsBase.h index c3d2e64b303..e0e81f0d24d 100644 --- a/src/Storages/System/StorageSystemPartsBase.h +++ b/src/Storages/System/StorageSystemPartsBase.h @@ -25,7 +25,7 @@ struct StoragesInfo explicit operator bool() const { return storage != nullptr; } MergeTreeData::DataPartsVector getParts(MergeTreeData::DataPartStateVector & state, bool has_state_column) const; - MergeTreeData::ProjectionPartsVector getProjectionParts(MergeTreeData::DataPartStateVector & state, bool has_state_column) const; + MergeTreeData::ProjectionPartsVector getProjectionParts(bool fill_states, bool has_state_column) const; }; /** A helper class that enumerates the storages that match given query. */ diff --git a/src/Storages/System/StorageSystemProjectionParts.cpp b/src/Storages/System/StorageSystemProjectionParts.cpp index 213865a8d61..44bdb294a2d 100644 --- a/src/Storages/System/StorageSystemProjectionParts.cpp +++ b/src/Storages/System/StorageSystemProjectionParts.cpp @@ -83,7 +83,11 @@ StorageSystemProjectionParts::StorageSystemProjectionParts(const StorageID & tab {"rows_where_ttl_info.expression", std::make_shared(std::make_shared())}, {"rows_where_ttl_info.min", std::make_shared(std::make_shared())}, - {"rows_where_ttl_info.max", std::make_shared(std::make_shared())} + {"rows_where_ttl_info.max", std::make_shared(std::make_shared())}, + + {"is_broken", std::make_shared()}, + {"exception_code", std::make_shared()}, + {"exception", std::make_shared()}, } ) { @@ -93,15 +97,14 @@ void StorageSystemProjectionParts::processNextStorage( ContextPtr, MutableColumns & columns, std::vector & columns_mask, const StoragesInfo & info, bool has_state_column) { using State = MergeTreeDataPartState; - MergeTreeData::DataPartStateVector all_parts_state; - MergeTreeData::ProjectionPartsVector all_parts = info.getProjectionParts(all_parts_state, has_state_column); - for (size_t part_number = 0; part_number < all_parts.projection_parts.size(); ++part_number) + MergeTreeData::ProjectionPartsVector all_parts = info.getProjectionParts(true, has_state_column); + auto fill_part_info = [&](size_t part_number, const MergeTreeData::DataPartsVector & parts, const MergeTreeData::DataPartStateVector & states) { - const auto & part = all_parts.projection_parts[part_number]; + const auto & part = parts[part_number]; const auto * parent_part = part->getParentPart(); chassert(parent_part); - auto part_state = all_parts_state[part_number]; + auto part_state = states[part_number]; ColumnSize columns_size = part->getTotalColumnsSize(); ColumnSize parent_columns_size = parent_part->getTotalColumnsSize(); @@ -278,10 +281,43 @@ void StorageSystemProjectionParts::processNextStorage( add_ttl_info_map(part->ttl_infos.group_by_ttl); add_ttl_info_map(part->ttl_infos.rows_where_ttl); + { + if (columns_mask[src_index++]) + 
columns[res_index++]->insert(part->is_broken.load(std::memory_order_relaxed)); + + if (part->is_broken) + { + std::lock_guard lock(part->broken_projections_mutex); + if (columns_mask[src_index++]) + columns[res_index++]->insert(part->exception_code); + if (columns_mask[src_index++]) + columns[res_index++]->insert(part->exception); + } + else + { + if (columns_mask[src_index++]) + columns[res_index++]->insertDefault(); + if (columns_mask[src_index++]) + columns[res_index++]->insertDefault(); + } + } + /// _state column should be the latest. /// Do not use part->getState*, it can be changed from different thread if (has_state_column) columns[res_index++]->insert(IMergeTreeDataPart::stateString(part_state)); + }; + + for (size_t part_number = 0; part_number < all_parts.projection_parts.size(); ++part_number) + { + auto part = all_parts.projection_parts[part_number]; + fill_part_info(part_number, all_parts.projection_parts, all_parts.projection_parts_states); + } + + for (size_t part_number = 0; part_number < all_parts.broken_projection_parts.size(); ++part_number) + { + auto part = all_parts.broken_projection_parts[part_number]; + fill_part_info(part_number, all_parts.broken_projection_parts, all_parts.broken_projection_parts_states); } } diff --git a/src/Storages/System/StorageSystemProjectionPartsColumns.cpp b/src/Storages/System/StorageSystemProjectionPartsColumns.cpp index 06becc6d91c..3f4224e46bb 100644 --- a/src/Storages/System/StorageSystemProjectionPartsColumns.cpp +++ b/src/Storages/System/StorageSystemProjectionPartsColumns.cpp @@ -103,15 +103,14 @@ void StorageSystemProjectionPartsColumns::processNextStorage( } /// Go through the list of projection parts. - MergeTreeData::DataPartStateVector all_parts_state; - MergeTreeData::ProjectionPartsVector all_parts = info.getProjectionParts(all_parts_state, has_state_column); - for (size_t part_number = 0; part_number < all_parts.projection_parts.size(); ++part_number) + MergeTreeData::ProjectionPartsVector all_parts = info.getProjectionParts(true, has_state_column); + auto fill_part_info = [&](size_t part_number, const MergeTreeData::DataPartsVector & parts, const MergeTreeData::DataPartStateVector & states) { - const auto & part = all_parts.projection_parts[part_number]; + const auto & part = parts[part_number]; const auto * parent_part = part->getParentPart(); chassert(parent_part); - auto part_state = all_parts_state[part_number]; + auto part_state = states[part_number]; auto columns_size = part->getTotalColumnsSize(); auto parent_columns_size = parent_part->getTotalColumnsSize(); @@ -260,6 +259,18 @@ void StorageSystemProjectionPartsColumns::processNextStorage( if (has_state_column) columns[res_index++]->insert(part->stateString()); } + }; + + for (size_t part_number = 0; part_number < all_parts.projection_parts.size(); ++part_number) + { + auto part = all_parts.projection_parts[part_number]; + fill_part_info(part_number, all_parts.projection_parts, all_parts.projection_parts_states); + } + + for (size_t part_number = 0; part_number < all_parts.broken_projection_parts.size(); ++part_number) + { + auto part = all_parts.broken_projection_parts[part_number]; + fill_part_info(part_number, all_parts.broken_projection_parts, all_parts.broken_projection_parts_states); } } diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference new file mode 100644 index 00000000000..d0b07e081db --- /dev/null +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -0,0 
+1,224 @@ +insert new part +insert new part +insert new part +insert new part +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj' +16 +12 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +select from projection 'proj_2' +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +check table +1 +0 +broke metadata of part 'proj' (parent part: all_2_2_0) +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj' +16 +12 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +select from projection 'proj_2' +16 +12 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +check table +0 +broken projections info +all_2_2_0 proj FILE_DOESNT_EXIST +check table full +all_0_0_0 1 +all_1_1_0 1 +all_3_3_0 1 +all_2_2_0 0 Part all_2_2_0 has a broken projection. It will be ignored. +0 +broke data of part 'proj_2' (parent part: all_2_2_0) +broken projections info +all_2_2_0 proj FILE_DOESNT_EXIST +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj' +16 +12 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +select from projection 'proj_2' +FILE_DOESNT_EXIST +check table +0 +broken projections info +all_2_2_0 proj FILE_DOESNT_EXIST +all_2_2_0 proj_2 NO_FILE_IN_DATA_PART +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 [] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj' +16 +12 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +select from projection 'proj_2' +16 +12 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +check table +0 +0 +broke data of part 'proj_2' (parent part: all_3_3_0) +broken projections info +all_2_2_0 proj FILE_DOESNT_EXIST +all_2_2_0 proj_2 NO_FILE_IN_DATA_PART +insert new part +insert new part +optimize +0 +broken projections info +all_2_2_0 proj FILE_DOESNT_EXIST +all_2_2_0 proj_2 NO_FILE_IN_DATA_PART +all_3_3_0 proj_2 NO_FILE_IN_DATA_PART +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 [] +all_3_3_0 0 ['proj'] +all_3_5_1 1 ['proj'] +all_4_4_0 0 ['proj','proj_2'] +all_5_5_0 0 ['proj','proj_2'] +select from projection 'proj' +16 +12 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +select from projection 'proj_2' +16 +12 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +check table +0 +0 +broke metadata of part 'proj' (parent part: all_1_1_0) +Detach - Attach +broken projections info +all_1_1_0 proj NO_FILE_IN_DATA_PART +all_2_2_0 proj NO_FILE_IN_DATA_PART +all_2_2_0 proj_2 FILE_DOESNT_EXIST +all_3_3_0 proj_2 FILE_DOESNT_EXIST +0 +broke data of part 'proj_2' (parent part: all_1_1_0) +Detach - Attach +broken projections info +all_1_1_0 proj NO_FILE_IN_DATA_PART +all_1_1_0 proj_2 FILE_DOESNT_EXIST +all_2_2_0 proj NO_FILE_IN_DATA_PART +all_2_2_0 proj_2 FILE_DOESNT_EXIST +all_3_3_0 proj_2 FILE_DOESNT_EXIST +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 [] +all_2_2_0 1 [] +all_3_3_0 0 ['proj'] +all_3_5_1 1 ['proj'] +all_4_4_0 0 
['proj','proj_2'] +all_5_5_0 0 ['proj','proj_2'] +select from projection 'proj' +16 +12 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +select from projection 'proj_2' +16 +12 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +check table +0 +check table full +all_3_5_1 1 +all_0_0_0 1 +all_1_1_0 0 Part all_1_1_0 has a broken projection. It will be ignored. +all_2_2_0 0 Part all_2_2_0 has a broken projection. It will be ignored. +materialize projection proj +check table full +all_3_5_1_6 1 +all_0_0_0_6 1 +all_2_2_0_6 1 +all_1_1_0_6 1 +system.parts +all_0_0_0 0 ['proj','proj_2'] +all_0_0_0_6 1 ['proj','proj_2'] +all_1_1_0 0 [] +all_1_1_0_6 1 ['proj','proj_2'] +all_2_2_0 0 [] +all_2_2_0_6 1 ['proj','proj_2'] +all_3_3_0 0 ['proj'] +all_3_5_1 0 ['proj'] +all_3_5_1_6 1 ['proj'] +all_4_4_0 0 ['proj','proj_2'] +all_5_5_0 0 ['proj','proj_2'] +select from projection 'proj' +16 +12 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +select from projection 'proj_2' +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +check table +1 +materialize projection proj_2 +check table full +all_3_5_1_7 1 +all_0_0_0_7 1 +all_2_2_0_7 1 +all_1_1_0_7 1 +system.parts +all_0_0_0 0 ['proj','proj_2'] +all_0_0_0_6 0 ['proj','proj_2'] +all_0_0_0_7 1 ['proj','proj_2'] +all_1_1_0 0 [] +all_1_1_0_6 0 ['proj','proj_2'] +all_1_1_0_7 1 ['proj','proj_2'] +all_2_2_0 0 [] +all_2_2_0_6 0 ['proj','proj_2'] +all_2_2_0_7 1 ['proj','proj_2'] +all_3_3_0 0 ['proj'] +all_3_5_1 0 ['proj'] +all_3_5_1_6 0 ['proj'] +all_3_5_1_7 1 ['proj','proj_2'] +all_4_4_0 0 ['proj','proj_2'] +all_5_5_0 0 ['proj','proj_2'] +select from projection 'proj' +12 +16 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +select from projection 'proj_2' +16 +12 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +check table +1 diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh new file mode 100755 index 00000000000..81adfe6e49d --- /dev/null +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -0,0 +1,283 @@ +#!/usr/bin/env bash + +CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# shellcheck source=../shell_config.sh +. 
"$CURDIR"/../shell_config.sh + +$CLICKHOUSE_CLIENT -nm -q " +DROP TABLE IF EXISTS test SYNC; +CREATE TABLE test +( + a String, + b String, + c Int32, + d Int32, + e Int32, + + PROJECTION proj + ( + SELECT c ORDER BY d + ), + PROJECTION proj_2 + ( + SELECT d ORDER BY c + ) +) +ENGINE = ReplicatedMergeTree('/test2/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '1') PRIMARY KEY (a) +SETTINGS min_bytes_for_wide_part = 0, + max_parts_to_merge_at_once=3, + enable_vertical_merge_algorithm=1, + vertical_merge_algorithm_min_rows_to_activate = 1, + vertical_merge_algorithm_min_columns_to_activate = 1, + vertical_merge_algorithm_min_columns_to_activate = 1; +" + +table_uuid=$($CLICKHOUSE_CLIENT -q "SELECT uuid FROM system.tables WHERE table='test' and database=currentDatabase()") + +function random() +{ + cat /dev/urandom | LC_ALL=C tr -dc 'a-zA-Z' | fold -w ${1:-8} | head -n 1 +} + +function insert() +{ + offset=$1 + size=$2 + echo 'insert new part' + $CLICKHOUSE_CLIENT -q "INSERT INTO test SELECT number, number, number, number, number%2 FROM numbers($offset, $size);" +} + +function break_projection() +{ + part_name=$1 + parent_name=$2 + break_type=$3 + + read -r disk_name part_path <<< $($CLICKHOUSE_CLIENT -nm -q " + SELECT disk_name, path + FROM system.projection_parts + WHERE table='test' + AND database=currentDatabase() + AND active=1 + AND part_name='$part_name' + AND parent_name='$parent_name' + LIMIT 1; + ") + + path=$($CLICKHOUSE_CLIENT -q "SELECT path FROM system.disks WHERE name='$disk_name'") + + # make sure path is absolute + $CLICKHOUSE_CLIENT -q "select throwIf(substring('$path', 1, 1) != '/', 'Path is relative: $path')" || exit + + if [ "$break_type" = "data" ] + then + rm "$path/$part_path/d.bin" + rm "$path/$part_path/c.bin" + echo "broke data of part '$part_name' (parent part: $parent_name)" + else + rm "$path/$part_path/columns.txt" + echo "broke metadata of part '$part_name' (parent part: $parent_name)" + fi +} + +function broken_projections_info() +{ + echo 'broken projections info' + $CLICKHOUSE_CLIENT -q " + SELECT parent_name, name, errors.name FROM + ( + SELECT parent_name, name, exception_code + FROM system.projection_parts + WHERE table='test' + AND database=currentDatabase() + AND is_broken = 1 + ) AS parts_info + INNER JOIN system.errors AS errors + ON parts_info.exception_code = errors.code + ORDER BY parent_name, name +" +} + +function check() +{ + expect_broken_part="" + expected_error="" + if [ $# -ne 0 ]; then + expect_broken_part=$1 + expected_error=$2 + fi + + echo 'system.parts' + $CLICKHOUSE_CLIENT -q " + SELECT name, active, projections + FROM system.parts + WHERE table='test' AND database=currentDatabase() + ORDER BY name;" + + echo "select from projection 'proj'" + query_id=$(random 8) + + if [ "$expect_broken_part" = "proj" ] + then + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12;" 2>&1 | grep -o $expected_error + else + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12 OR d == 16;" + echo 'used projections' + $CLICKHOUSE_CLIENT -nm -q " + SYSTEM FLUSH LOGS; + SELECT query, projections FROM system.query_log WHERE query_id='$query_id' and type='QueryFinish' + " + fi + + echo "select from projection 'proj_2'" + query_id=$(random 8) + + if [ "$expect_broken_part" = "proj_2" ] + then + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12;" 2>&1 | grep -o $expected_error + else + $CLICKHOUSE_CLIENT 
--optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12 OR c == 16;" + echo 'used projections' + $CLICKHOUSE_CLIENT -nm -q " + SYSTEM FLUSH LOGS; + SELECT query, projections FROM system.query_log WHERE query_id='$query_id' and type='QueryFinish' + " + fi + + echo 'check table' + $CLICKHOUSE_CLIENT -q "CHECK TABLE test" +} + +function optimize_no_wait() +{ + echo 'optimize' + $CLICKHOUSE_CLIENT -nm -q "OPTIMIZE TABLE test SETTINGS alter_sync=0;" +} + +function reattach() +{ + echo 'Detach - Attach' + $CLICKHOUSE_CLIENT -nm -q " + DETACH TABLE test; + ATTACH TABLE test; + " +} + +function materialize_projection +{ + projection=$1 + echo "materialize projection $projection" + $CLICKHOUSE_CLIENT -q "ALTER TABLE test MATERIALIZE PROJECTION $projection SETTINGS mutations_sync=2" +} + +function check_table_full() +{ + echo 'check table full' + $CLICKHOUSE_CLIENT -q "CHECK TABLE test SETTINGS check_query_single_value_result = 0" +} + + +insert 0 5 + +insert 5 5 + +insert 10 5 + +insert 15 5 + +check + +# Break metadata file of projection 'proj' +break_projection proj all_2_2_0 metadata + +# Do select and after "check table" query. +# Select works because it does not read columns.txt. +check + +# Projection 'proj' from part all_2_2_0 will now appear in broken parts info +# because it was marked broken during "check table" query. +# TODO: try to mark it during select as well +broken_projections_info + +# Check table query will also show a list of parts which have broken projections. +check_table_full + +# Break data file of projection 'proj_2' for part all_2_2_0 +break_projection proj_2 all_2_2_0 data + +# It will not yet appear in broken projections info. +broken_projections_info + +# Select now fails with error "File doesn't exist" +check "proj_2" "FILE_DOESNT_EXIST" + +# Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info. +broken_projections_info + +# Second select works, because projection is now marked as broken. +check + +# Break data file of projection 'proj_2' for part all_3_3_0 +break_projection proj_2 all_3_3_0 data + +# It will not yet appear in broken projections info. +broken_projections_info + +insert 20 5 + +insert 25 5 + +# Part all_3_3_0 has 'proj' and 'proj_2' projections, but 'proj_2' is broken and server does NOT know it yet. +# Parts all_4_4_0 and all_5_5_0 have both non-broken projections. +# So a merge will be create for future part all_3_5_1. +# During merge it will fail to read from 'proj_2' of part all_3_3_0 and proj_2 will be marked broken. +# Merge will be retried and on second attempt it will succeed. +# The result part all_3_5_1 will have only 1 projection - 'proj', because +# it will skip 'proj_2' as it will see that one part does not have it anymore in the set of valid projections. +optimize_no_wait +sleep 2 + +$CLICKHOUSE_CLIENT -nm -q " +SYSTEM FLUSH LOGS; +SELECT count() FROM system.text_log +WHERE level='Error' +AND logger_name='MergeTreeBackgroundExecutor' +AND message like 'Exception while executing background task {$table_uuid:all_3_5_1}%Cannot open file%proj_2.proj/c.bin%' +" + +# Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info. 
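# Illustration only (not part of the test's expected output): the broken_projections_info helper above
# boils down to reading the new is_broken / exception_code columns of system.projection_parts, e.g.
#   SELECT parent_name, name, exception_code
#   FROM system.projection_parts
#   WHERE table = 'test' AND database = currentDatabase() AND is_broken = 1
# joining exception_code against system.errors, as the helper does, only turns the numeric code into a name.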
+broken_projections_info + +check + +break_projection proj all_1_1_0 metadata + +reattach + +broken_projections_info + +break_projection proj_2 all_1_1_0 data + +reattach + +broken_projections_info + +check + +check_table_full + +materialize_projection proj + +check_table_full + +check + +materialize_projection proj_2 + +check_table_full + +check + +$CLICKHOUSE_CLIENT -nm -q " +DROP TABLE test; +" From 6c42a3fad6b58efdf91115c3b80f267f1f604c62 Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 16 Nov 2023 16:43:34 +0100 Subject: [PATCH 0016/1081] Better --- src/Interpreters/MutationsInterpreter.cpp | 18 ++-- .../Optimizations/projectionsCommon.cpp | 2 +- src/Storages/MergeTree/IMergeTreeDataPart.cpp | 45 +++------ src/Storages/MergeTree/IMergeTreeDataPart.h | 11 +-- src/Storages/MergeTree/MergeTask.cpp | 5 +- src/Storages/MergeTree/MergeTreeData.cpp | 57 ++++++----- src/Storages/MergeTree/MergeTreeData.h | 4 +- src/Storages/MergeTree/MutateTask.cpp | 8 +- src/Storages/MergeTree/checkDataPart.cpp | 34 ++----- .../System/StorageSystemPartsBase.cpp | 8 +- src/Storages/System/StorageSystemPartsBase.h | 2 +- .../System/StorageSystemProjectionParts.cpp | 30 +++--- .../StorageSystemProjectionPartsColumns.cpp | 21 +--- .../02916_broken_projection.reference | 95 ++++++++----------- .../0_stateless/02916_broken_projection.sh | 12 +-- 15 files changed, 146 insertions(+), 206 deletions(-) diff --git a/src/Interpreters/MutationsInterpreter.cpp b/src/Interpreters/MutationsInterpreter.cpp index a9a5d4f33d0..237bffe4a67 100644 --- a/src/Interpreters/MutationsInterpreter.cpp +++ b/src/Interpreters/MutationsInterpreter.cpp @@ -753,7 +753,7 @@ void MutationsInterpreter::prepare(bool dry_run) { mutation_kind.set(MutationKind::MUTATE_INDEX_PROJECTION); const auto & projection = projections_desc.get(command.projection_name); - if (!source.hasProjection(projection.name)) + if (!source.hasProjection(projection.name) || source.hasBrokenProjection(projection.name)) { for (const auto & column : projection.required_columns) dependencies.emplace(column, ColumnDependency::PROJECTION); @@ -927,20 +927,18 @@ void MutationsInterpreter::prepare(bool dry_run) materialized_indices.insert(index.name); } - /// Always rebuild broken projections. - for (const auto & projection : metadata_snapshot->getProjections()) - { - if (!source.hasBrokenProjection(projection.name)) - continue; - - materialized_projections.insert(projection.name); - } - for (const auto & projection : metadata_snapshot->getProjections()) { if (!source.hasProjection(projection.name)) continue; + /// Always rebuild broken projections. 
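    /// In other words, a projection already marked as broken is re-materialized by the mutation
    /// unconditionally, even when it was not explicitly requested and need_rebuild_projections is false.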
+ if (source.hasBrokenProjection(projection.name)) + { + materialized_projections.insert(projection.name); + continue; + } + if (need_rebuild_projections) { materialized_projections.insert(projection.name); diff --git a/src/Processors/QueryPlan/Optimizations/projectionsCommon.cpp b/src/Processors/QueryPlan/Optimizations/projectionsCommon.cpp index c3b3449857b..9ebd5aaa32f 100644 --- a/src/Processors/QueryPlan/Optimizations/projectionsCommon.cpp +++ b/src/Processors/QueryPlan/Optimizations/projectionsCommon.cpp @@ -224,7 +224,7 @@ bool analyzeProjectionCandidate( { const auto & created_projections = part_with_ranges.data_part->getProjectionParts(); auto it = created_projections.find(candidate.projection->name); - if (it != created_projections.end()) + if (it != created_projections.end() && !it->second->is_broken) { projection_parts.push_back(it->second); } diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index bc81758675e..85ce112d9a1 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -745,8 +745,7 @@ void IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool ch LOG_ERROR(&Poco::Logger::get("IMergeTreeDataPart"), "Cannot load projection {}, will consider it broken", projection.name); - addBrokenProjectionPart(projection.name, std::move(part), getCurrentExceptionMessage(false), getCurrentExceptionCode()); - continue; + part->setBrokenReason(getCurrentExceptionMessage(false), getCurrentExceptionCode()); } addProjectionPart(projection.name, std::move(part)); @@ -2147,44 +2146,30 @@ std::optional IMergeTreeDataPart::getStreamNameForColumn( return getStreamNameOrHash(stream_name, extension, storage_); } -void IMergeTreeDataPart::addBrokenProjectionPart( - const String & projection_name, - std::shared_ptr projection_part, - const String & message, - int code) -{ - projection_part->setBrokenReason(message, code); - bool inserted = broken_projection_parts.emplace(projection_name, projection_part).second; - if (!inserted) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Projection part {} in part {} is already added to a broken projection parts list", projection_name, name); -} - void IMergeTreeDataPart::markProjectionPartAsBroken(const String & projection_name, const String & message, int code) const { - std::lock_guard lock(broken_projections_mutex); - auto it = projection_parts.find(projection_name); if (it == projection_parts.end()) throw Exception(ErrorCodes::LOGICAL_ERROR, "There is no projection part '{}'", projection_name); - it->second->setBrokenReason(message, code); - - broken_projection_parts.emplace(projection_name, it->second); - projection_parts.erase(it); -} - -void IMergeTreeDataPart::setBrokenReason(const String & message, int code) -{ - std::lock_guard lock(broken_projections_mutex); - is_broken = true; - exception = message; - exception_code = code; } bool IMergeTreeDataPart::hasBrokenProjection(const String & projection_name) const { - std::lock_guard lock(broken_projections_mutex); - return broken_projection_parts.contains(projection_name); + auto it = projection_parts.find(projection_name); + if (it == projection_parts.end()) + return false; + return it->second->is_broken; +} + +void IMergeTreeDataPart::setBrokenReason(const String & message, int code) const +{ + std::lock_guard lock(broken_reason_mutex); + if (is_broken) + return; + is_broken = true; + exception = message; + exception_code = code; } bool isCompactPart(const 
MergeTreeDataPartPtr & data_part) diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.h b/src/Storages/MergeTree/IMergeTreeDataPart.h index 52a1541e15f..9af2c16f1e8 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.h +++ b/src/Storages/MergeTree/IMergeTreeDataPart.h @@ -259,7 +259,7 @@ public: mutable std::atomic is_broken {false}; mutable std::string exception; mutable int exception_code = 0; - mutable std::mutex broken_projections_mutex; + mutable std::mutex broken_reason_mutex; /// Indicates that the part was marked Outdated by PartCheckThread because the part was not committed to ZooKeeper mutable bool is_unexpected_local_part = false; @@ -411,14 +411,10 @@ public: const std::map> & getProjectionParts() const { return projection_parts; } - const std::map> & getBrokenProjectionParts() const { return broken_projection_parts; } - MergeTreeDataPartBuilder getProjectionPartBuilder(const String & projection_name, bool is_temp_projection = false); void addProjectionPart(const String & projection_name, std::shared_ptr && projection_part); - void addBrokenProjectionPart(const String & projection_name, std::shared_ptr projection_part, const String & message, int code); - void markProjectionPartAsBroken(const String & projection_name, const String & message, int code) const; bool hasProjection(const String & projection_name) const { return projection_parts.contains(projection_name); } @@ -427,6 +423,8 @@ public: void loadProjections(bool require_columns_checksums, bool check_consistency, bool if_not_loaded = false); + void setBrokenReason(const String & message, int code) const; + /// Return set of metadata file names without checksums. For example, /// columns.txt or checksums.txt itself. NameSet getFileNamesWithoutChecksums() const; @@ -579,7 +577,6 @@ protected: String parent_part_name; mutable std::map> projection_parts; - mutable std::map> broken_projection_parts; mutable PartMetadataManagerPtr metadata_manager; @@ -693,8 +690,6 @@ private: void incrementStateMetric(MergeTreeDataPartState state) const; void decrementStateMetric(MergeTreeDataPartState state) const; - void setBrokenReason(const String & message, int code); - /// This ugly flag is needed for debug assertions only mutable bool part_is_probably_removed_from_disk = false; }; diff --git a/src/Storages/MergeTree/MergeTask.cpp b/src/Storages/MergeTree/MergeTask.cpp index adb1ca72e46..53ba1a57b27 100644 --- a/src/Storages/MergeTree/MergeTask.cpp +++ b/src/Storages/MergeTree/MergeTask.cpp @@ -696,8 +696,9 @@ bool MergeTask::MergeProjectionsStage::mergeMinMaxIndexAndPrepareProjections() c MergeTreeData::DataPartsVector projection_parts; for (const auto & part : global_ctx->future_part->parts) { - auto it = part->getProjectionParts().find(projection.name); - if (it != part->getProjectionParts().end()) + auto actual_projection_parts = part->getProjectionParts(); + auto it = actual_projection_parts.find(projection.name); + if (it != actual_projection_parts.end() && !it->second->is_broken) projection_parts.push_back(it->second); } if (projection_parts.size() < global_ctx->future_part->parts.size()) diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index 152c386e188..0725c3cbf32 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -5737,7 +5737,7 @@ MergeTreeData::getDataPartsVectorForInternalUsage(const DataPartStates & afforda } MergeTreeData::ProjectionPartsVector -MergeTreeData::getProjectionPartsVectorForInternalUsage(const 
DataPartStates & affordable_states, bool fill_states) const +MergeTreeData::getProjectionPartsVectorForInternalUsage(const DataPartStates & affordable_states, DataPartStateVector * out_states) const { auto lock = lockParts(); ProjectionPartsVector res; @@ -5749,20 +5749,14 @@ MergeTreeData::getProjectionPartsVectorForInternalUsage(const DataPartStates & a res.data_parts.push_back(part); for (const auto & [_, projection_part] : part->getProjectionParts()) res.projection_parts.push_back(projection_part); - for (const auto & [_, projection_part] : part->getBrokenProjectionParts()) - res.broken_projection_parts.push_back(projection_part); } } - if (fill_states) + if (out_states != nullptr) { - res.projection_parts_states.resize(res.projection_parts.size()); + out_states->resize(res.projection_parts.size()); for (size_t i = 0; i < res.projection_parts.size(); ++i) - (res.projection_parts_states)[i] = res.projection_parts[i]->getParentPart()->getState(); - - res.broken_projection_parts_states.resize(res.broken_projection_parts.size()); - for (size_t i = 0; i < res.broken_projection_parts.size(); ++i) - (res.broken_projection_parts_states)[i] = res.broken_projection_parts[i]->getParentPart()->getState(); + (*out_states)[i] = res.projection_parts[i]->getParentPart()->getState(); } return res; @@ -5815,7 +5809,7 @@ bool MergeTreeData::supportsLightweightDelete() const return true; } -MergeTreeData::ProjectionPartsVector MergeTreeData::getAllProjectionPartsVector(bool fill_states) const +MergeTreeData::ProjectionPartsVector MergeTreeData::getAllProjectionPartsVector(MergeTreeData::DataPartStateVector * out_states) const { ProjectionPartsVector res; auto lock = lockParts(); @@ -5826,15 +5820,11 @@ MergeTreeData::ProjectionPartsVector MergeTreeData::getAllProjectionPartsVector( res.projection_parts.push_back(projection_part); } - if (fill_states) + if (out_states != nullptr) { - res.projection_parts_states.resize(res.projection_parts.size()); + out_states->resize(res.projection_parts.size()); for (size_t i = 0; i < res.projection_parts.size(); ++i) - (res.projection_parts_states)[i] = res.projection_parts[i]->getParentPart()->getState(); - - res.broken_projection_parts_states.resize(res.broken_projection_parts.size()); - for (size_t i = 0; i < res.broken_projection_parts.size(); ++i) - (res.broken_projection_parts_states)[i] = res.broken_projection_parts[i]->getParentPart()->getState(); + (*out_states)[i] = res.projection_parts[i]->getParentPart()->getState(); } return res; } @@ -7050,8 +7040,7 @@ std::pair MergeTreeData::cloneAn } } - auto projections = src_part->getProjectionParts(); - for (const auto & [name, projection_part] : projections) + for (const auto & [name, projection_part] : src_part->getProjectionParts()) { const auto & projection_storage = projection_part->getDataPartStorage(); for (auto it = projection_storage.iterate(); it->isValid(); it->next()) @@ -7654,21 +7643,39 @@ MovePartsOutcome MergeTreeData::moveParts(const CurrentlyMovingPartsTaggerPtr & bool MergeTreeData::partsContainSameProjections(const DataPartPtr & left, const DataPartPtr & right, String & out_reason) { - if (left->getProjectionParts().size() != right->getProjectionParts().size()) + auto remove_broken_parts = [](auto & parts) + { + std::set broken_projection_parts; + for (const auto & [name, part] : parts) + { + if (part->is_broken) + broken_projection_parts.emplace(name); + } + for (const auto & name : broken_projection_parts) + parts.erase(name); + }; + + auto left_projection_parts = left->getProjectionParts(); + 
auto right_projection_parts = right->getProjectionParts(); + + remove_broken_parts(left_projection_parts); + remove_broken_parts(right_projection_parts); + + if (left_projection_parts.size() != right_projection_parts.size()) { out_reason = fmt::format( "Parts have different number of projections: {} in part '{}' and {} in part '{}'", - left->getProjectionParts().size(), + left_projection_parts.size(), left->name, - right->getProjectionParts().size(), + right_projection_parts.size(), right->name ); return false; } - for (const auto & [name, _] : left->getProjectionParts()) + for (const auto & [name, _] : left_projection_parts) { - if (!right->hasProjection(name)) + if (!right_projection_parts.contains(name)) { out_reason = fmt::format( "The part '{}' doesn't have projection '{}' while part '{}' does", right->name, name, left->name diff --git a/src/Storages/MergeTree/MergeTreeData.h b/src/Storages/MergeTree/MergeTreeData.h index 4ef3b75988b..18087c6b059 100644 --- a/src/Storages/MergeTree/MergeTreeData.h +++ b/src/Storages/MergeTree/MergeTreeData.h @@ -489,7 +489,7 @@ public: const DataPartStates & affordable_states, DataPartStateVector * out_states = nullptr) const; /// Same as above but only returns projection parts ProjectionPartsVector getProjectionPartsVectorForInternalUsage( - const DataPartStates & affordable_states, bool fill_states = false) const; + const DataPartStates & affordable_states, MergeTreeData::DataPartStateVector * out_states) const; /// Returns absolutely all parts (and snapshot of their states) @@ -501,7 +501,7 @@ public: size_t getTotalMarksCount() const; /// Same as above but only returns projection parts - ProjectionPartsVector getAllProjectionPartsVector(bool fill_states = false) const; + ProjectionPartsVector getAllProjectionPartsVector(MergeTreeData::DataPartStateVector * out_states = nullptr) const; /// Returns parts in Active state DataParts getDataPartsForInternalUsage() const; diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index 8ef1621b647..6a1ceec1cd3 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -514,8 +514,8 @@ static std::set getProjectionsToRecalculate( bool need_recalculate = materialized_projections.contains(projection.name) || (!is_full_part_storage - && (source_part->hasProjection(projection.name) - || source_part->hasBrokenProjection(projection.name))); + && source_part->hasProjection(projection.name) + && !source_part->hasBrokenProjection(projection.name)); if (need_recalculate) projections_to_recalc.insert(&projection); @@ -1370,8 +1370,8 @@ private: bool need_recalculate = ctx->materialized_projections.contains(projection.name) || (!is_full_part_storage - && (ctx->source_part->hasProjection(projection.name) - || ctx->source_part->hasBrokenProjection(projection.name))); + && ctx->source_part->hasProjection(projection.name) + && !ctx->source_part->hasBrokenProjection(projection.name)); if (need_recalculate) { diff --git a/src/Storages/MergeTree/checkDataPart.cpp b/src/Storages/MergeTree/checkDataPart.cpp index 74af7cbb77c..8feabf344b5 100644 --- a/src/Storages/MergeTree/checkDataPart.cpp +++ b/src/Storages/MergeTree/checkDataPart.cpp @@ -272,14 +272,16 @@ static IMergeTreeDataPart::Checksums checkDataPart( } } - auto check_projection = [&](const String & name, std::shared_ptr projection) + for (const auto & [name, projection] : data_part->getProjectionParts()) { + if (is_cancelled()) + return {}; + auto projection_file = name + ".proj"; if 
(!throw_on_broken_projection && projection->is_broken) { projections_on_disk.erase(projection_file); checksums_txt.remove(projection_file); - return; } IMergeTreeDataPart::Checksums projection_checksums; @@ -297,10 +299,11 @@ static IMergeTreeDataPart::Checksums checkDataPart( if (isRetryableException(std::current_exception())) throw; - LOG_TEST(log, "Marking projection {} as broken ({})", name, projection_file); - - if (!data_part->hasBrokenProjection(name)) - data_part->markProjectionPartAsBroken(name, getCurrentExceptionMessage(false), getCurrentExceptionCode()); + if (!projection->is_broken) + { + LOG_TEST(log, "Marking projection {} as broken ({})", name, projection_file); + projection->setBrokenReason(getCurrentExceptionMessage(false), getCurrentExceptionCode()); + } is_broken_projection = true; if (throw_on_broken_projection) @@ -308,7 +311,6 @@ static IMergeTreeDataPart::Checksums checkDataPart( projections_on_disk.erase(projection_file); checksums_txt.remove(projection_file); - return; } checksums_data.files[projection_file] = IMergeTreeDataPart::Checksums::Checksum( @@ -316,24 +318,6 @@ static IMergeTreeDataPart::Checksums checkDataPart( projection_checksums.getTotalChecksumUInt128()); projections_on_disk.erase(projection_file); - }; - - auto broken_projection_parts = data_part->getBrokenProjectionParts(); /// Iterate over copy - for (const auto & [name, projection] : broken_projection_parts) - { - if (is_cancelled()) - return {}; - else - check_projection(name, projection); - } - - auto projection_parts = data_part->getProjectionParts(); /// Iterate over copy - for (const auto & [name, projection] : projection_parts) - { - if (is_cancelled()) - return {}; - else - check_projection(name, projection); } if (require_checksums && !projections_on_disk.empty()) diff --git a/src/Storages/System/StorageSystemPartsBase.cpp b/src/Storages/System/StorageSystemPartsBase.cpp index e97c13b1fed..513af6cfc46 100644 --- a/src/Storages/System/StorageSystemPartsBase.cpp +++ b/src/Storages/System/StorageSystemPartsBase.cpp @@ -64,7 +64,7 @@ StoragesInfo::getParts(MergeTreeData::DataPartStateVector & state, bool has_stat } MergeTreeData::ProjectionPartsVector -StoragesInfo::getProjectionParts(bool fill_states, bool has_state_column) const +StoragesInfo::getProjectionParts(MergeTreeData::DataPartStateVector & state, bool has_state_column) const { if (data->getInMemoryMetadataPtr()->projections.empty()) return {}; @@ -74,12 +74,12 @@ StoragesInfo::getProjectionParts(bool fill_states, bool has_state_column) const { /// If has_state_column is requested, return all states. 
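        /// (i.e. without the _state column this branch returns only Active and Outdated projection parts;
        /// with it, parts in every state are included)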
if (!has_state_column) - return data->getProjectionPartsVectorForInternalUsage({State::Active, State::Outdated}, fill_states); + return data->getProjectionPartsVectorForInternalUsage({State::Active, State::Outdated}, &state); - return data->getAllProjectionPartsVector(fill_states); + return data->getAllProjectionPartsVector(&state); } - return data->getProjectionPartsVectorForInternalUsage({State::Active}, fill_states); + return data->getProjectionPartsVectorForInternalUsage({State::Active}, &state); } StoragesInfoStream::StoragesInfoStream(const SelectQueryInfo & query_info, ContextPtr context) diff --git a/src/Storages/System/StorageSystemPartsBase.h b/src/Storages/System/StorageSystemPartsBase.h index e0e81f0d24d..c3d2e64b303 100644 --- a/src/Storages/System/StorageSystemPartsBase.h +++ b/src/Storages/System/StorageSystemPartsBase.h @@ -25,7 +25,7 @@ struct StoragesInfo explicit operator bool() const { return storage != nullptr; } MergeTreeData::DataPartsVector getParts(MergeTreeData::DataPartStateVector & state, bool has_state_column) const; - MergeTreeData::ProjectionPartsVector getProjectionParts(bool fill_states, bool has_state_column) const; + MergeTreeData::ProjectionPartsVector getProjectionParts(MergeTreeData::DataPartStateVector & state, bool has_state_column) const; }; /** A helper class that enumerates the storages that match given query. */ diff --git a/src/Storages/System/StorageSystemProjectionParts.cpp b/src/Storages/System/StorageSystemProjectionParts.cpp index 44bdb294a2d..3dbe6823dac 100644 --- a/src/Storages/System/StorageSystemProjectionParts.cpp +++ b/src/Storages/System/StorageSystemProjectionParts.cpp @@ -97,14 +97,15 @@ void StorageSystemProjectionParts::processNextStorage( ContextPtr, MutableColumns & columns, std::vector & columns_mask, const StoragesInfo & info, bool has_state_column) { using State = MergeTreeDataPartState; - MergeTreeData::ProjectionPartsVector all_parts = info.getProjectionParts(true, has_state_column); - auto fill_part_info = [&](size_t part_number, const MergeTreeData::DataPartsVector & parts, const MergeTreeData::DataPartStateVector & states) + MergeTreeData::DataPartStateVector all_parts_state; + MergeTreeData::ProjectionPartsVector all_parts = info.getProjectionParts(all_parts_state, has_state_column); + for (size_t part_number = 0; part_number < all_parts.projection_parts.size(); ++part_number) { - const auto & part = parts[part_number]; + const auto & part = all_parts.projection_parts[part_number]; const auto * parent_part = part->getParentPart(); chassert(parent_part); - auto part_state = states[part_number]; + auto part_state = all_parts_state[part_number]; ColumnSize columns_size = part->getTotalColumnsSize(); ColumnSize parent_columns_size = parent_part->getTotalColumnsSize(); @@ -275,7 +276,12 @@ void StorageSystemProjectionParts::processNextStorage( add_ttl_info_map(part->ttl_infos.moves_ttl); if (columns_mask[src_index++]) - columns[res_index++]->insert(queryToString(part->default_codec->getCodecDesc())); + { + if (part->default_codec) + columns[res_index++]->insert(queryToString(part->default_codec->getCodecDesc())); + else + columns[res_index++]->insertDefault(); + } add_ttl_info_map(part->ttl_infos.recompression_ttl); add_ttl_info_map(part->ttl_infos.group_by_ttl); @@ -287,7 +293,7 @@ void StorageSystemProjectionParts::processNextStorage( if (part->is_broken) { - std::lock_guard lock(part->broken_projections_mutex); + std::lock_guard lock(part->broken_reason_mutex); if (columns_mask[src_index++]) 
columns[res_index++]->insert(part->exception_code); if (columns_mask[src_index++]) @@ -306,18 +312,6 @@ void StorageSystemProjectionParts::processNextStorage( /// Do not use part->getState*, it can be changed from different thread if (has_state_column) columns[res_index++]->insert(IMergeTreeDataPart::stateString(part_state)); - }; - - for (size_t part_number = 0; part_number < all_parts.projection_parts.size(); ++part_number) - { - auto part = all_parts.projection_parts[part_number]; - fill_part_info(part_number, all_parts.projection_parts, all_parts.projection_parts_states); - } - - for (size_t part_number = 0; part_number < all_parts.broken_projection_parts.size(); ++part_number) - { - auto part = all_parts.broken_projection_parts[part_number]; - fill_part_info(part_number, all_parts.broken_projection_parts, all_parts.broken_projection_parts_states); } } diff --git a/src/Storages/System/StorageSystemProjectionPartsColumns.cpp b/src/Storages/System/StorageSystemProjectionPartsColumns.cpp index 3f4224e46bb..06becc6d91c 100644 --- a/src/Storages/System/StorageSystemProjectionPartsColumns.cpp +++ b/src/Storages/System/StorageSystemProjectionPartsColumns.cpp @@ -103,14 +103,15 @@ void StorageSystemProjectionPartsColumns::processNextStorage( } /// Go through the list of projection parts. - MergeTreeData::ProjectionPartsVector all_parts = info.getProjectionParts(true, has_state_column); - auto fill_part_info = [&](size_t part_number, const MergeTreeData::DataPartsVector & parts, const MergeTreeData::DataPartStateVector & states) + MergeTreeData::DataPartStateVector all_parts_state; + MergeTreeData::ProjectionPartsVector all_parts = info.getProjectionParts(all_parts_state, has_state_column); + for (size_t part_number = 0; part_number < all_parts.projection_parts.size(); ++part_number) { - const auto & part = parts[part_number]; + const auto & part = all_parts.projection_parts[part_number]; const auto * parent_part = part->getParentPart(); chassert(parent_part); - auto part_state = states[part_number]; + auto part_state = all_parts_state[part_number]; auto columns_size = part->getTotalColumnsSize(); auto parent_columns_size = parent_part->getTotalColumnsSize(); @@ -259,18 +260,6 @@ void StorageSystemProjectionPartsColumns::processNextStorage( if (has_state_column) columns[res_index++]->insert(part->stateString()); } - }; - - for (size_t part_number = 0; part_number < all_parts.projection_parts.size(); ++part_number) - { - auto part = all_parts.projection_parts[part_number]; - fill_part_info(part_number, all_parts.projection_parts, all_parts.projection_parts_states); - } - - for (size_t part_number = 0; part_number < all_parts.broken_projection_parts.size(); ++part_number) - { - auto part = all_parts.broken_projection_parts[part_number]; - fill_part_info(part_number, all_parts.broken_projection_parts, all_parts.broken_projection_parts_states); } } diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index d0b07e081db..62966036eed 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -8,15 +8,15 @@ all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' -16 12 +16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] select from projection 'proj_2' 12 16 used 
projections -SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] check table 1 0 @@ -27,23 +27,20 @@ all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' -16 12 +16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] select from projection 'proj_2' -16 12 +16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] check table 0 broken projections info all_2_2_0 proj FILE_DOESNT_EXIST check table full -all_0_0_0 1 -all_1_1_0 1 -all_3_3_0 1 all_2_2_0 0 Part all_2_2_0 has a broken projection. It will be ignored. 0 broke data of part 'proj_2' (parent part: all_2_2_0) @@ -52,13 +49,13 @@ all_2_2_0 proj FILE_DOESNT_EXIST system.parts all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj_2'] +all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' -16 12 +16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] select from projection 'proj_2' FILE_DOESNT_EXIST check table @@ -69,18 +66,18 @@ all_2_2_0 proj_2 NO_FILE_IN_DATA_PART system.parts all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 [] +all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' -16 12 +16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] select from projection 'proj_2' -16 12 +16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] check table 0 0 @@ -99,21 +96,21 @@ all_3_3_0 proj_2 NO_FILE_IN_DATA_PART system.parts all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 [] -all_3_3_0 0 ['proj'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 0 ['proj','proj_2'] all_3_5_1 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] select from projection 'proj' -16 12 +16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] select from projection 'proj_2' -16 12 +16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] check table 0 0 @@ -135,76 +132,66 @@ all_2_2_0 proj_2 FILE_DOESNT_EXIST all_3_3_0 proj_2 FILE_DOESNT_EXIST system.parts all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 [] -all_2_2_0 1 [] -all_3_3_0 0 ['proj'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 0 ['proj','proj_2'] all_3_5_1 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] select from projection 'proj' -16 12 +16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] select from projection 'proj_2' -16 12 +16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 
OR c == 16 ORDER BY d; ['default.test.proj_2'] check table 0 check table full -all_3_5_1 1 -all_0_0_0 1 -all_1_1_0 0 Part all_1_1_0 has a broken projection. It will be ignored. all_2_2_0 0 Part all_2_2_0 has a broken projection. It will be ignored. +all_1_1_0 0 Part all_1_1_0 has a broken projection. It will be ignored. materialize projection proj check table full -all_3_5_1_6 1 -all_0_0_0_6 1 -all_2_2_0_6 1 -all_1_1_0_6 1 system.parts all_0_0_0 0 ['proj','proj_2'] all_0_0_0_6 1 ['proj','proj_2'] -all_1_1_0 0 [] +all_1_1_0 0 ['proj','proj_2'] all_1_1_0_6 1 ['proj','proj_2'] -all_2_2_0 0 [] +all_2_2_0 0 ['proj','proj_2'] all_2_2_0_6 1 ['proj','proj_2'] -all_3_3_0 0 ['proj'] +all_3_3_0 0 ['proj','proj_2'] all_3_5_1 0 ['proj'] all_3_5_1_6 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] select from projection 'proj' -16 12 +16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] select from projection 'proj_2' 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] check table 1 materialize projection proj_2 check table full -all_3_5_1_7 1 -all_0_0_0_7 1 -all_2_2_0_7 1 -all_1_1_0_7 1 system.parts all_0_0_0 0 ['proj','proj_2'] all_0_0_0_6 0 ['proj','proj_2'] all_0_0_0_7 1 ['proj','proj_2'] -all_1_1_0 0 [] +all_1_1_0 0 ['proj','proj_2'] all_1_1_0_6 0 ['proj','proj_2'] all_1_1_0_7 1 ['proj','proj_2'] -all_2_2_0 0 [] +all_2_2_0 0 ['proj','proj_2'] all_2_2_0_6 0 ['proj','proj_2'] all_2_2_0_7 1 ['proj','proj_2'] -all_3_3_0 0 ['proj'] +all_3_3_0 0 ['proj','proj_2'] all_3_5_1 0 ['proj'] all_3_5_1_6 0 ['proj'] all_3_5_1_7 1 ['proj','proj_2'] @@ -214,11 +201,11 @@ select from projection 'proj' 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16; ['default.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] select from projection 'proj_2' -16 12 +16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] check table 1 diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 81adfe6e49d..4748506d9cf 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -23,7 +23,7 @@ CREATE TABLE test SELECT d ORDER BY c ) ) -ENGINE = ReplicatedMergeTree('/test2/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '1') PRIMARY KEY (a) +ENGINE = ReplicatedMergeTree('/test3/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '1') PRIMARY KEY (a) SETTINGS min_bytes_for_wide_part = 0, max_parts_to_merge_at_once=3, enable_vertical_merge_algorithm=1, @@ -119,9 +119,9 @@ function check() if [ "$expect_broken_part" = "proj" ] then - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12;" 2>&1 | grep -o $expected_error + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12 ORDER BY c;" 2>&1 | grep -o $expected_error else - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12 OR d == 16;" + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c;" echo 'used projections' 
$CLICKHOUSE_CLIENT -nm -q " SYSTEM FLUSH LOGS; @@ -134,9 +134,9 @@ function check() if [ "$expect_broken_part" = "proj_2" ] then - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12;" 2>&1 | grep -o $expected_error + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12 ORDER BY d;" 2>&1 | grep -o $expected_error else - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12 OR c == 16;" + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d;" echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " SYSTEM FLUSH LOGS; @@ -173,7 +173,7 @@ function materialize_projection function check_table_full() { echo 'check table full' - $CLICKHOUSE_CLIENT -q "CHECK TABLE test SETTINGS check_query_single_value_result = 0" + $CLICKHOUSE_CLIENT -q "CHECK TABLE test SETTINGS check_query_single_value_result = 0" | grep "broken" } From 8ea4e302a50db872a798c6cd39c6f5edb255ec49 Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 16 Nov 2023 19:43:32 +0100 Subject: [PATCH 0017/1081] Fix style check --- .../0_stateless/02916_broken_projection.sh | 31 ++++++++++++++++--- 1 file changed, 26 insertions(+), 5 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 4748506d9cf..bf0ec61fd76 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -1,4 +1,5 @@ #!/usr/bin/env bash +# shellcheck disable=SC2046 CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # shellcheck source=../shell_config.sh @@ -125,7 +126,7 @@ function check() echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " SYSTEM FLUSH LOGS; - SELECT query, projections FROM system.query_log WHERE query_id='$query_id' and type='QueryFinish' + SELECT query, projections FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' " fi @@ -140,7 +141,7 @@ function check() echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " SYSTEM FLUSH LOGS; - SELECT query, projections FROM system.query_log WHERE query_id='$query_id' and type='QueryFinish' + SELECT query, projections FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' " fi @@ -148,10 +149,20 @@ function check() $CLICKHOUSE_CLIENT -q "CHECK TABLE test" } -function optimize_no_wait() +function optimize() { + final=$1 + no_wait=$2 + echo 'optimize' - $CLICKHOUSE_CLIENT -nm -q "OPTIMIZE TABLE test SETTINGS alter_sync=0;" + query="OPTIMIZE TABLE test" + + if [ $final -eq 1 ]; then + query="$query FINAL" + if [ $no_wait -eq 1 ]; then + query="$query SETTINGS alter_sync=0" + + $CLICKHOUSE_CLIENT -nm -q $query } function reattach() @@ -234,7 +245,7 @@ insert 25 5 # Merge will be retried and on second attempt it will succeed. # The result part all_3_5_1 will have only 1 projection - 'proj', because # it will skip 'proj_2' as it will see that one part does not have it anymore in the set of valid projections. 
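As printed above, the new optimize() helper is missing the closing fi statements for its two conditions; a sketch of the presumably intended form (with $query also quoted to avoid word splitting):

function optimize()
{
    final=$1
    no_wait=$2

    echo 'optimize'
    query="OPTIMIZE TABLE test"

    if [ $final -eq 1 ]; then
        query="$query FINAL"
    fi
    if [ $no_wait -eq 1 ]; then
        query="$query SETTINGS alter_sync=0"
    fi

    $CLICKHOUSE_CLIENT -nm -q "$query"
}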
-optimize_no_wait +optimize 0 1 sleep 2 $CLICKHOUSE_CLIENT -nm -q " @@ -276,6 +287,16 @@ materialize_projection proj_2 check_table_full +break_projection proj all_3_5_1_7 data + +insert 30 5 + +optimize 1 0 + +insert 35 5 + +optimize 1 0 + check $CLICKHOUSE_CLIENT -nm -q " From 961bf074daf0c901a3e9d14b6caa4ba6cb37cc7c Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Mon, 20 Nov 2023 10:56:10 +0100 Subject: [PATCH 0018/1081] Initial draft version of adding backup support to AzureBlobStorage --- src/Backups/BackupFactory.cpp | 2 + src/Backups/BackupIO_AzureBlobStorage.cpp | 336 ++++++++++++++++++ src/Backups/BackupIO_AzureBlobStorage.h | 69 ++++ src/Backups/BackupImpl.cpp | 8 +- .../registerBackupEngineAzureBlobStorage.cpp | 134 +++++++ src/CMakeLists.txt | 3 + src/Common/ProfileEvents.cpp | 4 + .../copyAzureBlobStorageFile.cpp | 324 +++++++++++++++++ .../copyAzureBlobStorageFile.h | 58 +++ src/Storages/StorageAzureBlob.cpp | 11 + src/Storages/StorageAzureBlob.h | 1 + .../__init__.py | 1 + .../configs/config.xml | 11 + .../configs/disable_profilers.xml | 13 + .../configs/users.xml | 8 + .../test.py | 151 ++++++++ 16 files changed, 1132 insertions(+), 2 deletions(-) create mode 100644 src/Backups/BackupIO_AzureBlobStorage.cpp create mode 100644 src/Backups/BackupIO_AzureBlobStorage.h create mode 100644 src/Backups/registerBackupEngineAzureBlobStorage.cpp create mode 100644 src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp create mode 100644 src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h create mode 100644 tests/integration/test_backup_restore_azure_blob_storage/__init__.py create mode 100644 tests/integration/test_backup_restore_azure_blob_storage/configs/config.xml create mode 100644 tests/integration/test_backup_restore_azure_blob_storage/configs/disable_profilers.xml create mode 100644 tests/integration/test_backup_restore_azure_blob_storage/configs/users.xml create mode 100644 tests/integration/test_backup_restore_azure_blob_storage/test.py diff --git a/src/Backups/BackupFactory.cpp b/src/Backups/BackupFactory.cpp index 898ac7bc490..31e87a21fc2 100644 --- a/src/Backups/BackupFactory.cpp +++ b/src/Backups/BackupFactory.cpp @@ -33,11 +33,13 @@ void BackupFactory::registerBackupEngine(const String & engine_name, const Creat void registerBackupEnginesFileAndDisk(BackupFactory &); void registerBackupEngineS3(BackupFactory &); +void registerBackupEngineAzureBlobStorage(BackupFactory &); void registerBackupEngines(BackupFactory & factory) { registerBackupEnginesFileAndDisk(factory); registerBackupEngineS3(factory); + registerBackupEngineAzureBlobStorage(factory); } BackupFactory::BackupFactory() diff --git a/src/Backups/BackupIO_AzureBlobStorage.cpp b/src/Backups/BackupIO_AzureBlobStorage.cpp new file mode 100644 index 00000000000..d41d23e3c36 --- /dev/null +++ b/src/Backups/BackupIO_AzureBlobStorage.cpp @@ -0,0 +1,336 @@ +#include + +#if USE_AZURE_BLOB_STORAGE +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +#include + +#include + + +namespace fs = std::filesystem; + +namespace DB +{ +namespace ErrorCodes +{ + extern const int AZURE_BLOB_STORAGE_ERROR; + extern const int LOGICAL_ERROR; +} + +//using AzureClientPtr = std::shared_ptr; + +BackupReaderAzureBlobStorage::BackupReaderAzureBlobStorage( + StorageAzureBlob::Configuration configuration_, + const ReadSettings & read_settings_, + const WriteSettings & write_settings_, + const ContextPtr & context_) + : BackupReaderDefault(read_settings_, write_settings_, 
&Poco::Logger::get("BackupReaderAzureBlobStorage")) + , data_source_description{DataSourceType::AzureBlobStorage, "AzureBlobStorage", false, false} + , configuration(configuration_) +{ + client = StorageAzureBlob::createClient(configuration, /* is_read_only */ false); + settings = StorageAzureBlob::createSettingsAsSharedPtr(context_); + auto settings_as_unique_ptr = StorageAzureBlob::createSettings(context_); + object_storage = std::make_unique("BackupReaderAzureBlobStorage", + std::make_unique(*client.get()), + std::move(settings_as_unique_ptr)); +} + +BackupReaderAzureBlobStorage::~BackupReaderAzureBlobStorage() = default; + +bool BackupReaderAzureBlobStorage::fileExists(const String & file_name) +{ + String key; + if (startsWith(file_name, ".")) + { + key= configuration.blob_path + file_name; + } + else + { + key = file_name; + } + return object_storage->exists(StoredObject(key)); +} + +UInt64 BackupReaderAzureBlobStorage::getFileSize(const String & file_name) +{ + String key; + if (startsWith(file_name, ".")) + { + key= configuration.blob_path + file_name; + } + else + { + key = file_name; + } + ObjectMetadata object_metadata = object_storage->getObjectMetadata(key); + return object_metadata.size_bytes; +} + +std::unique_ptr BackupReaderAzureBlobStorage::readFile(const String & file_name) +{ + String key; + if (startsWith(file_name, ".")) + { + key= configuration.blob_path + file_name; + } + else + { + key = file_name; + } + return std::make_unique( + client, key, read_settings, settings->max_single_read_retries, + settings->max_single_download_retries); +} + +void BackupReaderAzureBlobStorage::copyFileToDisk(const String & path_in_backup, size_t file_size, bool encrypted_in_backup, + DiskPtr destination_disk, const String & destination_path, WriteMode write_mode) +{ + LOG_INFO(&Poco::Logger::get("BackupReaderAzureBlobStorage"), "Enter copyFileToDisk"); + + /// Use the native copy as a more optimal way to copy a file from AzureBlobStorage to AzureBlobStorage if it's possible. + /// We don't check for `has_throttling` here because the native copy almost doesn't use network. + auto destination_data_source_description = destination_disk->getDataSourceDescription(); + if (destination_data_source_description.sameKind(data_source_description) + && (destination_data_source_description.is_encrypted == encrypted_in_backup)) + { + LOG_TRACE(log, "Copying {} from AzureBlobStorage to disk {}", path_in_backup, destination_disk->getName()); + auto write_blob_function = [&](const Strings & blob_path, WriteMode mode, const std::optional & object_attributes) -> size_t + { + /// Object storage always uses mode `Rewrite` because it simulates append using metadata and different files. 
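            /// A two-element blob_path is interpreted as {object key, container}: blob_path[0] is used as the
            /// blob path and blob_path[1] as the container name when the destination client is constructed below.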
+ if (blob_path.size() != 2 || mode != WriteMode::Rewrite) + throw Exception(ErrorCodes::LOGICAL_ERROR, + "Blob writing function called with unexpected blob_path.size={} or mode={}", + blob_path.size(), mode); + + std::shared_ptr dest_client; + if (configuration.container == blob_path[1]) + { + dest_client = client; + } + else + { + StorageAzureBlob::Configuration dest_configuration = configuration; + dest_configuration.container = blob_path[1]; + dest_configuration.blob_path = blob_path[0]; + dest_client = StorageAzureBlob::createClient(dest_configuration, /* is_read_only */ false); + } + + + copyAzureBlobStorageFile( + client, + dest_client, + configuration.container, + fs::path(configuration.blob_path) / path_in_backup, + 0, + file_size, + /* dest_bucket= */ blob_path[1], + /* dest_key= */ blob_path[0], + settings, + read_settings, + object_attributes, + threadPoolCallbackRunner(getBackupsIOThreadPool().get(), "BackupReaderAzureBlobStorage"), + /* for_disk_azure_blob_storage= */ true); + + return file_size; + }; + + destination_disk->writeFileUsingBlobWritingFunction(destination_path, write_mode, write_blob_function); + return; /// copied! + } + + /// Fallback to copy through buffers. + BackupReaderDefault::copyFileToDisk(path_in_backup, file_size, encrypted_in_backup, destination_disk, destination_path, write_mode); +} + + +BackupWriterAzureBlobStorage::BackupWriterAzureBlobStorage( + StorageAzureBlob::Configuration configuration_, + const ReadSettings & read_settings_, + const WriteSettings & write_settings_, + const ContextPtr & context_) + : BackupWriterDefault(read_settings_, write_settings_, &Poco::Logger::get("BackupWriterAzureBlobStorage")) + , data_source_description{DataSourceType::AzureBlobStorage, "AzureBlobStorage", false, false} + , configuration(configuration_) +{ + client = StorageAzureBlob::createClient(configuration, /* is_read_only */ false); + settings = StorageAzureBlob::createSettingsAsSharedPtr(context_); + auto settings_as_unique_ptr = StorageAzureBlob::createSettings(context_); + object_storage = std::make_unique("BackupWriterAzureBlobStorage", + std::make_unique(*client.get()), + std::move(settings_as_unique_ptr)); +} + +void BackupWriterAzureBlobStorage::copyFileFromDisk(const String & path_in_backup, DiskPtr src_disk, const String & src_path, + bool copy_encrypted, UInt64 start_pos, UInt64 length) +{ + /// Use the native copy as a more optimal way to copy a file from AzureBlobStorage to AzureBlobStorage if it's possible. + auto source_data_source_description = src_disk->getDataSourceDescription(); + if (source_data_source_description.sameKind(data_source_description) && (source_data_source_description.is_encrypted == copy_encrypted)) + { + /// getBlobPath() can return more than 3 elements if the file is stored as multiple objects in AzureBlobStorage bucket. + /// In this case we can't use the native copy. 
+ if (auto blob_path = src_disk->getBlobPath(src_path); blob_path.size() == 2) + { + + std::shared_ptr src_client; + if (configuration.container == blob_path[1]) + { + src_client = client; + } + else + { + StorageAzureBlob::Configuration src_configuration = configuration; + src_configuration.container = blob_path[1]; + src_configuration.blob_path = blob_path[0]; + src_client = StorageAzureBlob::createClient(src_configuration, /* is_read_only */ false); + } + + LOG_TRACE(log, "Copying file {} from disk {} to AzureBlobStorag", src_path, src_disk->getName()); + copyAzureBlobStorageFile( + src_client, + client, + /* src_bucket */ blob_path[1], + /* src_key= */ blob_path[0], + start_pos, + length, + configuration.container, + fs::path(configuration.blob_path) / path_in_backup, + settings, + read_settings, + {}, + threadPoolCallbackRunner(getBackupsIOThreadPool().get(), "BackupWriterAzureBlobStorage")); + return; /// copied! + } + } + + /// Fallback to copy through buffers. + BackupWriterDefault::copyFileFromDisk(path_in_backup, src_disk, src_path, copy_encrypted, start_pos, length); +} + +void BackupWriterAzureBlobStorage::copyDataToFile(const String & path_in_backup, const CreateReadBufferFunction & create_read_buffer, UInt64 start_pos, UInt64 length) +{ + copyDataToAzureBlobStorageFile(create_read_buffer, start_pos, length, client, configuration.container, path_in_backup, settings, {}, + threadPoolCallbackRunner(getBackupsIOThreadPool().get(), "BackupWriterAzureBlobStorage")); +} + +BackupWriterAzureBlobStorage::~BackupWriterAzureBlobStorage() = default; + +bool BackupWriterAzureBlobStorage::fileExists(const String & file_name) +{ + String key; + if (startsWith(file_name, ".")) + { + key= configuration.blob_path + file_name; + } + else + { + key = file_name; + } + LOG_INFO(&Poco::Logger::get("BackupWriterAzureBlobStorage"), "Result fileExists {} ", object_storage->exists(StoredObject(key))); + + return object_storage->exists(StoredObject(key)); +} + +UInt64 BackupWriterAzureBlobStorage::getFileSize(const String & file_name) +{ + LOG_INFO(&Poco::Logger::get("BackupWriterAzureBlobStorage"), "Enter getFileSize"); + String key; + if (startsWith(file_name, ".")) + { + key= configuration.blob_path + file_name; + } + else + { + key = file_name; + } + RelativePathsWithMetadata children; + object_storage->listObjects(key,children,/*max_keys*/0); + if (children.empty()) + throw Exception(ErrorCodes::AZURE_BLOB_STORAGE_ERROR, "Object {} must exist"); + return children[0].metadata.size_bytes; +} + +std::unique_ptr BackupWriterAzureBlobStorage::readFile(const String & file_name, size_t /*expected_file_size*/) +{ + String key; + if (startsWith(file_name, ".")) + { + key= configuration.blob_path + file_name; + } + else + { + key = file_name; + } + + return std::make_unique( + client, key, read_settings, settings->max_single_read_retries, + settings->max_single_download_retries); +} + +std::unique_ptr BackupWriterAzureBlobStorage::writeFile(const String & file_name) +{ + String key; + if (startsWith(file_name, ".")) + { + key= configuration.blob_path + file_name; + } + else + { + key = file_name; + } + return std::make_unique( + client, + key, + settings->max_single_part_upload_size, + DBMS_DEFAULT_BUFFER_SIZE, + write_settings); +} + +void BackupWriterAzureBlobStorage::removeFile(const String & file_name) +{ + String key; + if (startsWith(file_name, ".")) + { + key= configuration.blob_path + file_name; + } + else + { + key = file_name; + } + StoredObject object(key); + 
object_storage->removeObjectIfExists(object); +} + +void BackupWriterAzureBlobStorage::removeFiles(const Strings & keys) +{ + StoredObjects objects; + for (const auto & key : keys) + objects.emplace_back(key); + + object_storage->removeObjectsIfExist(objects); + +} + +void BackupWriterAzureBlobStorage::removeFilesBatch(const Strings & keys) +{ + StoredObjects objects; + for (const auto & key : keys) + objects.emplace_back(key); + + object_storage->removeObjectsIfExist(objects); +} + +} + +#endif diff --git a/src/Backups/BackupIO_AzureBlobStorage.h b/src/Backups/BackupIO_AzureBlobStorage.h new file mode 100644 index 00000000000..6ef66fc432d --- /dev/null +++ b/src/Backups/BackupIO_AzureBlobStorage.h @@ -0,0 +1,69 @@ +#pragma once + +#include "config.h" + +#if USE_AZURE_BLOB_STORAGE +#include +#include +#include +#include + + +namespace DB +{ + +// using AzureClientPtr = std::shared_ptr; + +/// Represents a backup stored to Azure + class BackupReaderAzureBlobStorage : public BackupReaderDefault + { + public: + BackupReaderAzureBlobStorage(StorageAzureBlob::Configuration configuration_, const ReadSettings & read_settings_, const WriteSettings & write_settings_, const ContextPtr & context_); + ~BackupReaderAzureBlobStorage() override; + + bool fileExists(const String & file_name) override; + UInt64 getFileSize(const String & file_name) override; + std::unique_ptr readFile(const String & file_name) override; + + void copyFileToDisk(const String & path_in_backup, size_t file_size, bool encrypted_in_backup, + DiskPtr destination_disk, const String & destination_path, WriteMode write_mode) override; + + private: + const DataSourceDescription data_source_description; + std::shared_ptr client; + StorageAzureBlob::Configuration configuration; + std::unique_ptr object_storage; + std::shared_ptr settings; + }; + + + class BackupWriterAzureBlobStorage : public BackupWriterDefault + { + public: + BackupWriterAzureBlobStorage(StorageAzureBlob::Configuration configuration_, const ReadSettings & read_settings_, const WriteSettings & write_settings_, const ContextPtr & context_); + ~BackupWriterAzureBlobStorage() override; + + bool fileExists(const String & file_name) override; + UInt64 getFileSize(const String & file_name) override; + std::unique_ptr writeFile(const String & file_name) override; + + void copyDataToFile(const String & path_in_backup, const CreateReadBufferFunction & create_read_buffer, UInt64 start_pos, UInt64 length) override; + void copyFileFromDisk(const String & path_in_backup, DiskPtr src_disk, const String & src_path, + bool copy_encrypted, UInt64 start_pos, UInt64 length) override; + + void removeFile(const String & file_name) override; + void removeFiles(const Strings & file_names) override; + + private: + std::unique_ptr readFile(const String & file_name, size_t expected_file_size) override; + void removeFilesBatch(const Strings & file_names); + const DataSourceDescription data_source_description; + std::shared_ptr client; + StorageAzureBlob::Configuration configuration; + std::unique_ptr object_storage; + std::shared_ptr settings; + }; + +} + +#endif diff --git a/src/Backups/BackupImpl.cpp b/src/Backups/BackupImpl.cpp index bb97335d8fb..9363ca5e7a7 100644 --- a/src/Backups/BackupImpl.cpp +++ b/src/Backups/BackupImpl.cpp @@ -492,6 +492,7 @@ void BackupImpl::checkBackupDoesntExist() const else file_name_to_check_existence = ".backup"; + LOG_INFO(&Poco::Logger::get("BackupImpl"), "checkBackupDoesntExist 1"); if (writer->fileExists(file_name_to_check_existence)) throw 
Exception(ErrorCodes::BACKUP_ALREADY_EXISTS, "Backup {} already exists", backup_name_for_logging); @@ -499,6 +500,7 @@ void BackupImpl::checkBackupDoesntExist() const if (!is_internal_backup) { assert(!lock_file_name.empty()); + LOG_INFO(&Poco::Logger::get("BackupImpl"), "checkBackupDoesntExist 2"); if (writer->fileExists(lock_file_name)) throw Exception(ErrorCodes::BACKUP_ALREADY_EXISTS, "Backup {} is being written already", backup_name_for_logging); } @@ -522,6 +524,8 @@ bool BackupImpl::checkLockFile(bool throw_if_failed) const if (throw_if_failed) { + LOG_INFO(&Poco::Logger::get("BackupImpl"), "checkLockFile"); + if (!writer->fileExists(lock_file_name)) { throw Exception( @@ -886,12 +890,12 @@ void BackupImpl::writeFile(const BackupFileInfo & info, BackupEntryPtr entry) } else if (src_disk && from_immutable_file) { - LOG_TRACE(log, "Writing backup for file {} from {} (disk {}): data file #{}", info.data_file_name, src_file_desc, src_disk->getName(), info.data_file_index); + LOG_INFO(log, "Writing backup for file {} from {} (disk {}): data file #{}", info.data_file_name, src_file_desc, src_disk->getName(), info.data_file_index); writer->copyFileFromDisk(info.data_file_name, src_disk, src_file_path, info.encrypted_by_disk, info.base_size, info.size - info.base_size); } else { - LOG_TRACE(log, "Writing backup for file {} from {}: data file #{}", info.data_file_name, src_file_desc, info.data_file_index); + LOG_INFO(log, "Writing backup for file {} from {}: data file #{}", info.data_file_name, src_file_desc, info.data_file_index); auto create_read_buffer = [entry, read_settings = writer->getReadSettings()] { return entry->getReadBuffer(read_settings); }; writer->copyDataToFile(info.data_file_name, create_read_buffer, info.base_size, info.size - info.base_size); } diff --git a/src/Backups/registerBackupEngineAzureBlobStorage.cpp b/src/Backups/registerBackupEngineAzureBlobStorage.cpp new file mode 100644 index 00000000000..6f7b5f38c28 --- /dev/null +++ b/src/Backups/registerBackupEngineAzureBlobStorage.cpp @@ -0,0 +1,134 @@ +#include "config.h" + +#include +#include + +#if USE_AZURE_BLOB_STORAGE +#include +#include +#include +#include +#include +#include +#include +#endif + + +namespace DB +{ +namespace fs = std::filesystem; + +namespace ErrorCodes +{ + extern const int BAD_ARGUMENTS; + extern const int SUPPORT_IS_DISABLED; +} + +#if USE_AZURE_BLOB_STORAGE +namespace +{ + String removeFileNameFromURL(String & url) + { + Poco::URI url2{url}; + String path = url2.getPath(); + size_t slash_pos = path.find_last_of('/'); + String file_name = path.substr(slash_pos + 1); + path.resize(slash_pos + 1); + url2.setPath(path); + url = url2.toString(); + return file_name; + } +} +#endif + + +void registerBackupEngineAzureBlobStorage(BackupFactory & factory) +{ + auto creator_fn = []([[maybe_unused]] const BackupFactory::CreateParams & params) -> std::unique_ptr + { +#if USE_AZURE_BLOB_STORAGE + const String & id_arg = params.backup_info.id_arg; + const auto & args = params.backup_info.args; + + LOG_INFO(&Poco::Logger::get("registerBackupEngineAzureBlobStorage"), "Begin id_arg={} args.size={}", id_arg, args.size()); + + StorageAzureBlob::Configuration configuration; + + if (args.size() == 4) + { + configuration.connection_url = args[0].safeGet(); + configuration.is_connection_string = true; + + configuration.container = args[1].safeGet(); + configuration.blob_path = args[2].safeGet(); + configuration.format = args[3].safeGet(); + + LOG_TRACE(&Poco::Logger::get("registerBackupEngineAzureBlobStorage"), 
"configuration.connection_url = {}" + "configuration.container = {}" + "configuration.blob_path = {}" + "configuration.format = {}", + configuration.connection_url, configuration.container, configuration.blob_path, configuration.format); + } + + + BackupImpl::ArchiveParams archive_params; + if (hasRegisteredArchiveFileExtension(configuration.blob_path)) + { + if (params.is_internal_backup) + throw Exception(ErrorCodes::SUPPORT_IS_DISABLED, "Using archives with backups on clusters is disabled"); + + archive_params.archive_name = removeFileNameFromURL(configuration.blob_path); + archive_params.compression_method = params.compression_method; + archive_params.compression_level = params.compression_level; + archive_params.password = params.password; + } + else + { + if (!params.password.empty()) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Password is not applicable, backup cannot be encrypted"); + } + + + if (params.open_mode == IBackup::OpenMode::READ) + { + auto reader = std::make_shared(configuration, + params.read_settings, + params.write_settings, + params.context); + + return std::make_unique( + params.backup_info, + archive_params, + params.base_backup_info, + reader, + params.context, + /*params.use_same_s3_credentials_for_base_backup*/ false); + } + else + { + auto writer = std::make_shared(configuration, + params.read_settings, + params.write_settings, + params.context); + + return std::make_unique( + params.backup_info, + archive_params, + params.base_backup_info, + writer, + params.context, + params.is_internal_backup, + params.backup_coordination, + params.backup_uuid, + params.deduplicate_files, + /*params.use_same_s3_credentials_for_base_backup*/ false); + } +#else + throw Exception(ErrorCodes::SUPPORT_IS_DISABLED, "AzureBlobStorage support is disabled"); +#endif + }; + + factory.registerBackupEngine("AzureBlobStorage", creator_fn); +} + +} diff --git a/src/CMakeLists.txt b/src/CMakeLists.txt index 0257b7d329b..984594a6541 100644 --- a/src/CMakeLists.txt +++ b/src/CMakeLists.txt @@ -87,6 +87,7 @@ add_headers_and_sources(clickhouse_common_io IO) add_headers_and_sources(clickhouse_common_io IO/Archives) add_headers_and_sources(clickhouse_common_io IO/Resource) add_headers_and_sources(clickhouse_common_io IO/S3) +add_headers_and_sources(clickhouse_common_io IO/AzureBlobStorage) list (REMOVE_ITEM clickhouse_common_io_sources Common/malloc.cpp Common/new_delete.cpp) @@ -139,6 +140,7 @@ endif() if (TARGET ch_contrib::azure_sdk) add_headers_and_sources(dbms Disks/ObjectStorages/AzureBlobStorage) + add_headers_and_sources(dbms IO/AzureBlobStorage) endif() if (TARGET ch_contrib::hdfs) @@ -485,6 +487,7 @@ if (TARGET ch_contrib::aws_s3) endif() if (TARGET ch_contrib::azure_sdk) + target_link_libraries (clickhouse_common_io PUBLIC ch_contrib::azure_sdk) dbms_target_link_libraries (PRIVATE ch_contrib::azure_sdk) endif() diff --git a/src/Common/ProfileEvents.cpp b/src/Common/ProfileEvents.cpp index 58e860ebcaf..1655d19986a 100644 --- a/src/Common/ProfileEvents.cpp +++ b/src/Common/ProfileEvents.cpp @@ -361,6 +361,10 @@ The server successfully detected this situation and will download merged part fr M(S3PutObject, "Number of S3 API PutObject calls.") \ M(S3GetObject, "Number of S3 API GetObject calls.") \ \ + M(AzureUploadPart, "Number of Azure blob storage API UploadPart calls") \ + M(DiskAzureUploadPart, "Number of Disk Azure blob storage API UploadPart calls") \ + M(AzureCopyObject, "Number of Azure blob storage API CopyObject calls") \ + M(DiskAzureCopyObject, "Number of Disk Azure blob 
storage API CopyObject calls") \ M(AzureDeleteObjects, "Number of Azure blob storage API DeleteObject(s) calls.") \ M(AzureListObjects, "Number of Azure blob storage API ListObjects calls.") \ \ diff --git a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp new file mode 100644 index 00000000000..bf0bcac664b --- /dev/null +++ b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp @@ -0,0 +1,324 @@ +#include + +#if USE_AZURE_BLOB_STORAGE + +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +namespace ProfileEvents +{ + extern const Event AzureCopyObject; + extern const Event AzureUploadPart; + + extern const Event DiskAzureCopyObject; + extern const Event DiskAzureUploadPart; +} + + +namespace DB +{ + +size_t max_single_operation_copy_size = 256 * 1024 * 1024; + + +namespace +{ + class UploadHelper + { + public: + UploadHelper( + const CreateReadBuffer & create_read_buffer_, + std::shared_ptr client_, + size_t offset_, + size_t total_size_, + const String & dest_bucket_, + const String & dest_key_, + std::shared_ptr settings_, + const std::optional> & object_metadata_, + ThreadPoolCallbackRunner schedule_, + bool for_disk_azure_blob_storage_) + : create_read_buffer(create_read_buffer_) + , client(client_) + , offset (offset_) + , total_size (total_size_) + , dest_bucket(dest_bucket_) + , dest_key(dest_key_) + , settings(settings_) + , object_metadata(object_metadata_) + , schedule(schedule_) + , for_disk_azure_blob_storage(for_disk_azure_blob_storage_) + , log(&Poco::Logger::get("azureBlobStorageUploadHelper")) + , max_single_part_upload_size(settings_.get()->max_single_part_upload_size) + { + } + + ~UploadHelper() {} + + protected: + std::function()> create_read_buffer; + std::shared_ptr client; + size_t offset; + size_t total_size; + const String & dest_bucket; + const String & dest_key; + std::shared_ptr settings; + const std::optional> & object_metadata; + ThreadPoolCallbackRunner schedule; + bool for_disk_azure_blob_storage; + const Poco::Logger * log; + size_t max_single_part_upload_size; + + struct UploadPartTask + { + char *data = nullptr; + size_t size = 0; + std::string block_id; + bool is_finished = false; + std::exception_ptr exception; + + ~UploadPartTask() + { + if (data != nullptr) + free(data); + } + }; + + size_t normal_part_size; + std::vector block_ids; + + std::list TSA_GUARDED_BY(bg_tasks_mutex) bg_tasks; + int num_added_bg_tasks TSA_GUARDED_BY(bg_tasks_mutex) = 0; + int num_finished_bg_tasks TSA_GUARDED_BY(bg_tasks_mutex) = 0; + std::mutex bg_tasks_mutex; + std::condition_variable bg_tasks_condvar; + + public: + void performCopy() + { + performMultipartUpload(); + } + + void completeMultipartUpload() + { + auto block_blob_client = client->GetBlockBlobClient(dest_key); + block_blob_client.CommitBlockList(block_ids); + } + + void performMultipartUpload() + { + normal_part_size = 1024; + + size_t position = offset; + size_t end_position = offset + total_size; + + try + { + while (position < end_position) + { + size_t next_position = std::min(position + normal_part_size, end_position); + size_t part_size = next_position - position; /// `part_size` is either `normal_part_size` or smaller if it's the final part. + + uploadPart(position, part_size); + + position = next_position; + } + } + catch (...) 
+ { + tryLogCurrentException(__PRETTY_FUNCTION__); + waitForAllBackgroundTasks(); + throw; + } + + waitForAllBackgroundTasks(); + completeMultipartUpload(); + } + + + void uploadPart(size_t part_offset, size_t part_size) + { + LOG_TRACE(log, "Writing part. Bucket: {}, Key: {}, Size: {}", dest_bucket, dest_key, part_size); + + if (!part_size) + { + LOG_TRACE(log, "Skipping writing an empty part."); + return; + } + + if (schedule) + { + UploadPartTask * task = nullptr; + + { + std::lock_guard lock(bg_tasks_mutex); + task = &bg_tasks.emplace_back(); + ++num_added_bg_tasks; + } + + /// Notify waiting thread when task finished + auto task_finish_notify = [this, task]() + { + std::lock_guard lock(bg_tasks_mutex); + task->is_finished = true; + ++num_finished_bg_tasks; + + /// Notification under mutex is important here. + /// Otherwise, WriteBuffer could be destroyed in between + /// Releasing lock and condvar notification. + bg_tasks_condvar.notify_one(); + }; + + try + { + auto read_buffer = std::make_unique(create_read_buffer(), part_offset, part_size); + auto buffer = std::make_unique(std::move(read_buffer), part_size); + task->data = new char[part_size]; + task->size = part_size; + buffer->read(task->data,part_size); + task->block_id = getRandomASCIIString(64); + + schedule([this, task, task_finish_notify]() + { + try + { + processUploadTask(*task); + } + catch (...) + { + task->exception = std::current_exception(); + } + task_finish_notify(); + }, Priority{}); + } + catch (...) + { + task_finish_notify(); + throw; + } + } + else + { + UploadPartTask task; + auto read_buffer = std::make_unique(create_read_buffer(), part_offset, part_size); + auto buffer = std::make_unique(std::move(read_buffer), part_size); + task.data = new char[part_size]; + buffer->read(task.data,part_size); + task.size = part_size; + processUploadTask(task); + block_ids.emplace_back(task.block_id); + } + } + + void processUploadTask(UploadPartTask & task) + { + auto block_id = processUploadPartRequest(task); + + std::lock_guard lock(bg_tasks_mutex); /// Protect bg_tasks from race + task.block_id = block_id; + LOG_TRACE(log, "Writing part finished. 
Bucket: {}, Key: {}, block_id: {}, Parts: {}", dest_bucket, dest_key, block_id, bg_tasks.size()); + } + + String processUploadPartRequest(UploadPartTask & task) + { + ProfileEvents::increment(ProfileEvents::AzureUploadPart); + if (for_disk_azure_blob_storage) + ProfileEvents::increment(ProfileEvents::DiskAzureUploadPart); + + auto block_blob_client = client->GetBlockBlobClient(dest_key); + task.block_id = getRandomASCIIString(64); + Azure::Core::IO::MemoryBodyStream memory(reinterpret_cast(task.data), task.size); + block_blob_client.StageBlock(task.block_id, memory); + + return task.block_id; + } + + + void waitForAllBackgroundTasks() + { + if (!schedule) + return; + + std::unique_lock lock(bg_tasks_mutex); + /// Suppress warnings because bg_tasks_mutex is actually hold, but tsa annotations do not understand std::unique_lock + bg_tasks_condvar.wait(lock, [this]() {return TSA_SUPPRESS_WARNING_FOR_READ(num_added_bg_tasks) == TSA_SUPPRESS_WARNING_FOR_READ(num_finished_bg_tasks); }); + + auto & tasks = TSA_SUPPRESS_WARNING_FOR_WRITE(bg_tasks); + for (auto & task : tasks) + { + if (task.exception) + std::rethrow_exception(task.exception); + block_ids.emplace_back(task.block_id); + } + } + }; +} + + +void copyDataToAzureBlobStorageFile( + const std::function()> & create_read_buffer, + size_t offset, + size_t size, + std::shared_ptr & dest_client, + const String & dest_bucket, + const String & dest_key, + std::shared_ptr settings, + const std::optional> & object_metadata, + ThreadPoolCallbackRunner schedule, + bool for_disk_azure_blob_storage) +{ + UploadHelper helper{create_read_buffer, dest_client, offset, size, dest_bucket, dest_key, settings, object_metadata, schedule, for_disk_azure_blob_storage}; + helper.performCopy(); +} + + +void copyAzureBlobStorageFile( + std::shared_ptr src_client, + std::shared_ptr dest_client, + const String & src_bucket, + const String & src_key, + size_t offset, + size_t size, + const String & dest_bucket, + const String & dest_key, + std::shared_ptr settings, + const ReadSettings & read_settings, + const std::optional> & object_metadata, + ThreadPoolCallbackRunner schedule, + bool for_disk_azure_blob_storage) +{ + + if (size < max_single_operation_copy_size) + { + ProfileEvents::increment(ProfileEvents::AzureCopyObject); + if (for_disk_azure_blob_storage) + ProfileEvents::increment(ProfileEvents::DiskAzureCopyObject); + auto block_blob_client_src = src_client->GetBlockBlobClient(src_key); + auto block_blob_client_dest = dest_client->GetBlockBlobClient(dest_key); + auto uri = block_blob_client_src.GetUrl(); + block_blob_client_dest.CopyFromUri(uri); + } + else + { + LOG_TRACE(&Poco::Logger::get("copyAzureBlobStorageFile"), "Reading from Bucket: {}, Key: {}", src_bucket, src_key); + auto create_read_buffer = [&] + { + return std::make_unique(src_client, src_key, read_settings, settings->max_single_read_retries, + settings->max_single_download_retries); + }; + + UploadHelper helper{create_read_buffer, dest_client, offset, size, dest_bucket, dest_key, settings, object_metadata, schedule, for_disk_azure_blob_storage}; + helper.performCopy(); + } +} + +} + +#endif diff --git a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h new file mode 100644 index 00000000000..31228fbcb23 --- /dev/null +++ b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h @@ -0,0 +1,58 @@ +#pragma once + +#include "config.h" + +#if USE_AZURE_BLOB_STORAGE + +#include +#include +#include +#include +#include +#include + + +namespace DB +{ 
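Before the header that follows, it may help to see the overall copy strategy of copyAzureBlobStorageFile above in isolation: blobs smaller than max_single_operation_copy_size (256 MiB) are copied server-side with a single CopyFromUri call, while larger ones are re-uploaded as staged blocks that are committed at the end. The sketch below is only an illustration under those assumptions; the function name, the part size, and the block-id scheme are invented here, and it omits the thread-pool scheduling and random block ids that UploadHelper uses:

```cpp
#include <azure/storage/blobs.hpp>
#include <azure/core/io/body_stream.hpp>
#include <algorithm>
#include <cstdint>
#include <cstdio>
#include <string>
#include <vector>

using Azure::Storage::Blobs::BlobContainerClient;

/// Illustrative sketch: copy `size` bytes (already available in `data`) from one blob to another.
void copyBlobSketch(
    BlobContainerClient & src, BlobContainerClient & dest,
    const std::string & src_key, const std::string & dest_key,
    const uint8_t * data, size_t size)
{
    auto src_blob = src.GetBlockBlobClient(src_key);
    auto dest_blob = dest.GetBlockBlobClient(dest_key);

    if (size < 256 * 1024 * 1024) /// max_single_operation_copy_size in the patch
    {
        /// Small blob: one server-side copy, no payload passes through the client.
        dest_blob.CopyFromUri(src_blob.GetUrl());
        return;
    }

    /// Large blob: stage fixed-size blocks, then commit the whole block list at once.
    const size_t part_size = 8 * 1024 * 1024; /// illustrative part size
    std::vector<std::string> block_ids;
    for (size_t offset = 0; offset < size; offset += part_size)
    {
        size_t n = std::min(part_size, size - offset);
        char id[17];
        std::snprintf(id, sizeof(id), "%016zu", block_ids.size()); /// fixed-length, base64-safe id
        Azure::Core::IO::MemoryBodyStream stream(data + offset, n);
        dest_blob.StageBlock(id, stream);
        block_ids.emplace_back(id);
    }
    dest_blob.CommitBlockList(block_ids);
}
```

In the patch itself, the large-blob path is driven by UploadHelper, which schedules each StageBlock on the backups IO thread pool and only commits after waitForAllBackgroundTasks has observed every part finish.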
+class SeekableReadBuffer; + +using CreateReadBuffer = std::function()>; + +/// Copies a file from AzureBlobStorage to AzureBlobStorage. +/// The parameters `src_offset` and `src_size` specify a part in the source to copy. +void copyAzureBlobStorageFile( + std::shared_ptr src_client, + std::shared_ptr dest_client, + const String & src_bucket, + const String & src_key, + size_t src_offset, + size_t src_size, + const String & dest_bucket, + const String & dest_key, + std::shared_ptr settings, + const ReadSettings & read_settings, + const std::optional> & object_metadata = std::nullopt, + ThreadPoolCallbackRunner schedule_ = {}, + bool for_disk_azure_blob_storage = false); + + +/// Copies data from any seekable source to AzureBlobStorage. +/// The same functionality can be done by using the function copyData() and the class WriteBufferFromS3 +/// however copyDataToS3File() is faster and spends less memory. +/// The callback `create_read_buffer` can be called from multiple threads in parallel, so that should be thread-safe. +/// The parameters `offset` and `size` specify a part in the source to copy. +void copyDataToAzureBlobStorageFile( + const std::function()> & create_read_buffer, + size_t offset, + size_t size, + std::shared_ptr & client, + const String & dest_bucket, + const String & dest_key, + std::shared_ptr settings, + const std::optional> & object_metadata = std::nullopt, + ThreadPoolCallbackRunner schedule_ = {}, + bool for_disk_azure_blob_storage = false); + +} + +#endif diff --git a/src/Storages/StorageAzureBlob.cpp b/src/Storages/StorageAzureBlob.cpp index 2e0703a8df3..e36604cfb1a 100644 --- a/src/Storages/StorageAzureBlob.cpp +++ b/src/Storages/StorageAzureBlob.cpp @@ -258,6 +258,17 @@ AzureObjectStorage::SettingsPtr StorageAzureBlob::createSettings(ContextPtr loca return settings_ptr; } +std::shared_ptr StorageAzureBlob::createSettingsAsSharedPtr(ContextPtr local_context) +{ + const auto & context_settings = local_context->getSettingsRef(); + auto settings_ptr = std::make_shared(); + settings_ptr->max_single_part_upload_size = context_settings.azure_max_single_part_upload_size; + settings_ptr->max_single_read_retries = context_settings.azure_max_single_read_retries; + settings_ptr->list_object_keys_size = static_cast(context_settings.azure_list_object_keys_size); + + return settings_ptr; +} + void registerStorageAzureBlob(StorageFactory & factory) { factory.registerStorage("AzureBlobStorage", [](const StorageFactory::Arguments & args) diff --git a/src/Storages/StorageAzureBlob.h b/src/Storages/StorageAzureBlob.h index b97dee0caed..570e4124d73 100644 --- a/src/Storages/StorageAzureBlob.h +++ b/src/Storages/StorageAzureBlob.h @@ -80,6 +80,7 @@ public: static AzureClientPtr createClient(StorageAzureBlob::Configuration configuration, bool is_read_only); static AzureObjectStorage::SettingsPtr createSettings(ContextPtr local_context); + static std::shared_ptr createSettingsAsSharedPtr(ContextPtr local_context); static void processNamedCollectionResult(StorageAzureBlob::Configuration & configuration, const NamedCollection & collection); diff --git a/tests/integration/test_backup_restore_azure_blob_storage/__init__.py b/tests/integration/test_backup_restore_azure_blob_storage/__init__.py new file mode 100644 index 00000000000..e5a0d9b4834 --- /dev/null +++ b/tests/integration/test_backup_restore_azure_blob_storage/__init__.py @@ -0,0 +1 @@ +#!/usr/bin/env python3 diff --git a/tests/integration/test_backup_restore_azure_blob_storage/configs/config.xml 
b/tests/integration/test_backup_restore_azure_blob_storage/configs/config.xml new file mode 100644 index 00000000000..5725dce40cd --- /dev/null +++ b/tests/integration/test_backup_restore_azure_blob_storage/configs/config.xml @@ -0,0 +1,11 @@ + + 1 + 0 + 0.0 + 0 + 1 + 1 + 0 + 16 + 16 + \ No newline at end of file diff --git a/tests/integration/test_backup_restore_azure_blob_storage/configs/disable_profilers.xml b/tests/integration/test_backup_restore_azure_blob_storage/configs/disable_profilers.xml new file mode 100644 index 00000000000..b74bb1502ce --- /dev/null +++ b/tests/integration/test_backup_restore_azure_blob_storage/configs/disable_profilers.xml @@ -0,0 +1,13 @@ + + + + + 0 + 0 + 0 + 1000 + 1 + 1 + + + diff --git a/tests/integration/test_backup_restore_azure_blob_storage/configs/users.xml b/tests/integration/test_backup_restore_azure_blob_storage/configs/users.xml new file mode 100644 index 00000000000..c12eb2f79f4 --- /dev/null +++ b/tests/integration/test_backup_restore_azure_blob_storage/configs/users.xml @@ -0,0 +1,8 @@ + + + + + default + + + diff --git a/tests/integration/test_backup_restore_azure_blob_storage/test.py b/tests/integration/test_backup_restore_azure_blob_storage/test.py new file mode 100644 index 00000000000..2ecf08a4f40 --- /dev/null +++ b/tests/integration/test_backup_restore_azure_blob_storage/test.py @@ -0,0 +1,151 @@ +#!/usr/bin/env python3 + +import gzip +import json +import logging +import os +import io +import random +import threading +import time + +from azure.storage.blob import BlobServiceClient +import helpers.client +import pytest +from helpers.cluster import ClickHouseCluster, ClickHouseInstance +from helpers.network import PartitionManager +from helpers.mock_servers import start_mock_servers +from helpers.test_tools import exec_query_with_retry + + + +@pytest.fixture(scope="module") +def cluster(): + try: + cluster = ClickHouseCluster(__file__) + cluster.add_instance( + "node", + main_configs=["configs/config.xml"], + user_configs=["configs/disable_profilers.xml", "configs/users.xml"], + with_azurite=True, + ) + cluster.start() + + yield cluster + finally: + cluster.shutdown() + + +def azure_query( + node, query, expect_error="false", try_num=10, settings={}, query_on_retry=None +): + for i in range(try_num): + try: + if expect_error == "true": + return node.query_and_get_error(query, settings=settings) + else: + return node.query(query, settings=settings) + except Exception as ex: + retriable_errors = [ + "DB::Exception: Azure::Core::Http::TransportException: Connection was closed by the server while trying to read a response", + "DB::Exception: Azure::Core::Http::TransportException: Connection closed before getting full response or response is less than expected", + "DB::Exception: Azure::Core::Http::TransportException: Connection was closed by the server while trying to read a response", + "DB::Exception: Azure::Core::Http::TransportException: Error while polling for socket ready read", + "Azure::Core::Http::TransportException, e.what() = Connection was closed by the server while trying to read a response", + "Azure::Core::Http::TransportException, e.what() = Connection closed before getting full response or response is less than expected", + "Azure::Core::Http::TransportException, e.what() = Connection was closed by the server while trying to read a response", + "Azure::Core::Http::TransportException, e.what() = Error while polling for socket ready read", + ] + retry = False + for error in retriable_errors: + if error in str(ex): + retry = 
True + print(f"Try num: {i}. Having retriable error: {ex}") + time.sleep(i) + break + if not retry or i == try_num - 1: + raise Exception(ex) + if query_on_retry is not None: + node.query(query_on_retry) + continue + + +def get_azure_file_content(filename, port): + container_name = "cont" + connection_string = ( + f"DefaultEndpointsProtocol=http;AccountName=devstoreaccount1;" + f"AccountKey=Eby8vdM02xNOcqFlqUwJPLlmEtlCDXJ1OUzFT50uSRZ6IFsuFq2UVErCz4I6tq/K1SZFPTOtr/KBHBeksoGMGw==;" + f"BlobEndpoint=http://127.0.0.1:{port}/devstoreaccount1;" + ) + blob_service_client = BlobServiceClient.from_connection_string( + str(connection_string) + ) + container_client = blob_service_client.get_container_client(container_name) + blob_client = container_client.get_blob_client(filename) + download_stream = blob_client.download_blob() + return download_stream.readall().decode("utf-8") + + +def put_azure_file_content(filename, port, data): + container_name = "cont" + connection_string = ( + f"DefaultEndpointsProtocol=http;AccountName=devstoreaccount1;" + f"AccountKey=Eby8vdM02xNOcqFlqUwJPLlmEtlCDXJ1OUzFT50uSRZ6IFsuFq2UVErCz4I6tq/K1SZFPTOtr/KBHBeksoGMGw==;" + f"BlobEndpoint=http://127.0.0.1:{port}/devstoreaccount1;" + ) + blob_service_client = BlobServiceClient.from_connection_string(connection_string) + try: + container_client = blob_service_client.create_container(container_name) + except: + container_client = blob_service_client.get_container_client(container_name) + + blob_client = container_client.get_blob_client(filename) + buf = io.BytesIO(data) + blob_client.upload_blob(buf) + +@pytest.fixture(autouse=True, scope="function") +def delete_all_files(cluster): + port = cluster.env_variables["AZURITE_PORT"] + connection_string = ( + f"DefaultEndpointsProtocol=http;AccountName=devstoreaccount1;" + f"AccountKey=Eby8vdM02xNOcqFlqUwJPLlmEtlCDXJ1OUzFT50uSRZ6IFsuFq2UVErCz4I6tq/K1SZFPTOtr/KBHBeksoGMGw==;" + f"BlobEndpoint=http://127.0.0.1:{port}/devstoreaccount1;" + ) + blob_service_client = BlobServiceClient.from_connection_string(connection_string) + containers = blob_service_client.list_containers() + for container in containers: + container_client = blob_service_client.get_container_client(container) + blob_list = container_client.list_blobs() + for blob in blob_list: + print(blob) + blob_client = container_client.get_blob_client(blob) + blob_client.delete_blob() + + assert len(list(container_client.list_blobs())) == 0 + + yield + + +def test_create_table_connection_string(cluster): + node = cluster.instances["node"] + azure_query( + node, + f"CREATE TABLE test_create_table_conn_string (key UInt64, data String) Engine = AzureBlobStorage('{cluster.env_variables['AZURITE_CONNECTION_STRING']}', 'cont', 'test_create_connection_string', 'CSV')", + ) + +def test_backup_restore(cluster): + node = cluster.instances["node"] + port = cluster.env_variables["AZURITE_PORT"] + azure_query( + node, + f"CREATE TABLE test_simple_write_connection_string (key UInt64, data String) Engine = AzureBlobStorage('{cluster.env_variables['AZURITE_CONNECTION_STRING']}', 'cont', 'test_simple_write_c.csv', 'CSV')", + ) + azure_query(node, f"INSERT INTO test_simple_write_connection_string VALUES (1, 'a')") + print(get_azure_file_content("test_simple_write_c.csv", port)) + assert get_azure_file_content("test_simple_write_c.csv", port) == '1,"a"\n' + + backup_destination = f"AzureBlobStorage('{cluster.env_variables['AZURITE_CONNECTION_STRING']}', 'cont', 'test_simple_write_c_backup.csv', 'CSV')" + azure_query(node,f"BACKUP TABLE 
test_simple_write_connection_string TO {backup_destination}") + print (get_azure_file_content("test_simple_write_c_backup.csv.backup", port)) + azure_query(node, f"RESTORE TABLE test_simple_write_connection_string AS test_simple_write_connection_string_restored FROM {backup_destination};") + assert(azure_query(node,f"SELECT * from test_simple_write_connection_string_restored") == "1\ta\n") \ No newline at end of file From 05b608cd76da8995086887f812e1ab3fceb99551 Mon Sep 17 00:00:00 2001 From: robot-clickhouse Date: Mon, 20 Nov 2023 10:12:45 +0000 Subject: [PATCH 0019/1081] Automatic style fix --- .../test.py | 24 ++++++++++++++----- 1 file changed, 18 insertions(+), 6 deletions(-) diff --git a/tests/integration/test_backup_restore_azure_blob_storage/test.py b/tests/integration/test_backup_restore_azure_blob_storage/test.py index 2ecf08a4f40..cda3cab07e4 100644 --- a/tests/integration/test_backup_restore_azure_blob_storage/test.py +++ b/tests/integration/test_backup_restore_azure_blob_storage/test.py @@ -18,7 +18,6 @@ from helpers.mock_servers import start_mock_servers from helpers.test_tools import exec_query_with_retry - @pytest.fixture(scope="module") def cluster(): try: @@ -103,6 +102,7 @@ def put_azure_file_content(filename, port, data): buf = io.BytesIO(data) blob_client.upload_blob(buf) + @pytest.fixture(autouse=True, scope="function") def delete_all_files(cluster): port = cluster.env_variables["AZURITE_PORT"] @@ -133,6 +133,7 @@ def test_create_table_connection_string(cluster): f"CREATE TABLE test_create_table_conn_string (key UInt64, data String) Engine = AzureBlobStorage('{cluster.env_variables['AZURITE_CONNECTION_STRING']}', 'cont', 'test_create_connection_string', 'CSV')", ) + def test_backup_restore(cluster): node = cluster.instances["node"] port = cluster.env_variables["AZURITE_PORT"] @@ -140,12 +141,23 @@ def test_backup_restore(cluster): node, f"CREATE TABLE test_simple_write_connection_string (key UInt64, data String) Engine = AzureBlobStorage('{cluster.env_variables['AZURITE_CONNECTION_STRING']}', 'cont', 'test_simple_write_c.csv', 'CSV')", ) - azure_query(node, f"INSERT INTO test_simple_write_connection_string VALUES (1, 'a')") + azure_query( + node, f"INSERT INTO test_simple_write_connection_string VALUES (1, 'a')" + ) print(get_azure_file_content("test_simple_write_c.csv", port)) assert get_azure_file_content("test_simple_write_c.csv", port) == '1,"a"\n' backup_destination = f"AzureBlobStorage('{cluster.env_variables['AZURITE_CONNECTION_STRING']}', 'cont', 'test_simple_write_c_backup.csv', 'CSV')" - azure_query(node,f"BACKUP TABLE test_simple_write_connection_string TO {backup_destination}") - print (get_azure_file_content("test_simple_write_c_backup.csv.backup", port)) - azure_query(node, f"RESTORE TABLE test_simple_write_connection_string AS test_simple_write_connection_string_restored FROM {backup_destination};") - assert(azure_query(node,f"SELECT * from test_simple_write_connection_string_restored") == "1\ta\n") \ No newline at end of file + azure_query( + node, + f"BACKUP TABLE test_simple_write_connection_string TO {backup_destination}", + ) + print(get_azure_file_content("test_simple_write_c_backup.csv.backup", port)) + azure_query( + node, + f"RESTORE TABLE test_simple_write_connection_string AS test_simple_write_connection_string_restored FROM {backup_destination};", + ) + assert ( + azure_query(node, f"SELECT * from test_simple_write_connection_string_restored") + == "1\ta\n" + ) From 6dfb1c25ec6a4a61a4fe329191c10263eb19ad07 Mon Sep 17 00:00:00 2001 From: 
Smita Kulkarni Date: Mon, 20 Nov 2023 11:37:06 +0100 Subject: [PATCH 0020/1081] Added docs --- docs/en/operations/backup.md | 21 +++++++++++++++++++++ 1 file changed, 21 insertions(+) diff --git a/docs/en/operations/backup.md b/docs/en/operations/backup.md index 6068b185ede..15d953249a0 100644 --- a/docs/en/operations/backup.md +++ b/docs/en/operations/backup.md @@ -451,3 +451,24 @@ To disallow concurrent backup/restore, you can use these settings respectively. The default value for both is true, so by default concurrent backup/restores are allowed. When these settings are false on a cluster, only 1 backup/restore is allowed to run on a cluster at a time. + +## Configuring BACKUP/RESTORE to use an AzureBlobStorage Endpoint + +To write backups to an AzureBlobStorage container you need the following pieces of information: +- AzureBlobStorage endpoint connection string / url, +- Container, +- Path, +- Account name (if url is specified) +- Account Key (if url is specified) + +The destination for a backup will be specified like this: +``` +AzureBlobStorage('/', '', '', '', ') +``` + +```sql +BACKUP TABLE data TO AzureBlobStorage('DefaultEndpointsProtocol=http;AccountName=devstoreaccount1;AccountKey=Eby8vdM02xNOcqFlqUwJPLlmEtlCDXJ1OUzFT50uSRZ6IFsuFq2UVErCz4I6tq/K1SZFPTOtr/KBHBeksoGMGw==;BlobEndpoint=http://azurite1:10000/devstoreaccount1/;', + 'test_container', 'data_backup'); +RESTORE TABLE data AS data_restored FROM AzureBlobStorage('DefaultEndpointsProtocol=http;AccountName=devstoreaccount1;AccountKey=Eby8vdM02xNOcqFlqUwJPLlmEtlCDXJ1OUzFT50uSRZ6IFsuFq2UVErCz4I6tq/K1SZFPTOtr/KBHBeksoGMGw==;BlobEndpoint=http://azurite1:10000/devstoreaccount1/;', + 'test_container', 'data_backup'); +``` From 96c4b6bc35ee818afd2d2963dec7afdb5583969c Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Mon, 20 Nov 2023 14:41:14 +0100 Subject: [PATCH 0021/1081] Updated to not analyze create parameterized view for analyzer & old analyzer --- src/Interpreters/InterpreterCreateQuery.cpp | 48 +++++-------------- src/Storages/StorageView.cpp | 3 +- .../0_stateless/02428_parameterized_view.sh | 2 +- 3 files changed, 14 insertions(+), 39 deletions(-) diff --git a/src/Interpreters/InterpreterCreateQuery.cpp b/src/Interpreters/InterpreterCreateQuery.cpp index 747c0be009e..4ee666e2a9a 100644 --- a/src/Interpreters/InterpreterCreateQuery.cpp +++ b/src/Interpreters/InterpreterCreateQuery.cpp @@ -649,6 +649,7 @@ ColumnsDescription InterpreterCreateQuery::getColumnsDescription( if (!attach && !is_restore_from_backup && context_->getSettingsRef().flatten_nested) res.flattenNested(); + if (res.getAllPhysical().empty()) throw Exception(ErrorCodes::EMPTY_LIST_OF_COLUMNS_PASSED, "Cannot CREATE table without physical columns"); @@ -755,49 +756,22 @@ InterpreterCreateQuery::TableProperties InterpreterCreateQuery::getTableProperti { Block as_select_sample; - if (getContext()->getSettingsRef().allow_experimental_analyzer) + if (!create.isParameterizedView()) { - if (create.isParameterizedView()) - { - auto select = create.select->clone(); - - ///Get all query parameters - const auto parameters = analyzeReceiveQueryParamsWithType(select); - NameToNameMap parameter_values; - - for (const auto & parameter : parameters) - { - const auto data_type = DataTypeFactory::instance().get(parameter.second); - /// Todo improve getting default values & include more datatypes - if (data_type->isValueRepresentedByNumber() || parameter.second == "String") - parameter_values[parameter.first] = "1"; - else if (parameter.second.starts_with("Array") || 
parameter.second.starts_with("Map")) - parameter_values[parameter.first] = "[]"; - else - parameter_values[parameter.first] = " "; - } - - /// Replace with default parameters - ReplaceQueryParameterVisitor visitor(parameter_values); - visitor.visit(select); - - as_select_sample = InterpreterSelectQueryAnalyzer::getSampleBlock(select, getContext()); - } - else + if (getContext()->getSettingsRef().allow_experimental_analyzer) { as_select_sample = InterpreterSelectQueryAnalyzer::getSampleBlock(create.select->clone(), getContext()); } + else + { + as_select_sample = InterpreterSelectWithUnionQuery::getSampleBlock(create.select->clone(), + getContext(), + false /* is_subquery */, + create.isParameterizedView()); + } + properties.columns = ColumnsDescription(as_select_sample.getNamesAndTypesList()); } - else - { - as_select_sample = InterpreterSelectWithUnionQuery::getSampleBlock(create.select->clone(), - getContext(), - false /* is_subquery */, - create.isParameterizedView()); - } - - properties.columns = ColumnsDescription(as_select_sample.getNamesAndTypesList()); } else if (create.as_table_function) { diff --git a/src/Storages/StorageView.cpp b/src/Storages/StorageView.cpp index f0f9b9540de..2f7267e3701 100644 --- a/src/Storages/StorageView.cpp +++ b/src/Storages/StorageView.cpp @@ -112,7 +112,8 @@ StorageView::StorageView( : IStorage(table_id_) { StorageInMemoryMetadata storage_metadata; - storage_metadata.setColumns(columns_); + if (is_parameterized_view_ && !query.isParameterizedView()) + storage_metadata.setColumns(columns_); storage_metadata.setComment(comment); if (!query.select) diff --git a/tests/queries/0_stateless/02428_parameterized_view.sh b/tests/queries/0_stateless/02428_parameterized_view.sh index ad9c672f4c5..499b8697ffc 100755 --- a/tests/queries/0_stateless/02428_parameterized_view.sh +++ b/tests/queries/0_stateless/02428_parameterized_view.sh @@ -37,7 +37,7 @@ $CLICKHOUSE_CLIENT -q "CREATE VIEW test_02428_pv1 AS SELECT * FROM test_02428_Ca $CLICKHOUSE_CLIENT -q "SELECT Price FROM test_02428_pv1(price=20)" $CLICKHOUSE_CLIENT -q "SELECT Price FROM \`test_02428_pv1\`(price=20)" -$CLICKHOUSE_CLIENT -q "SELECT Price FROM test_02428_pv1" 2>&1 | grep -Fq "UNKNOWN_QUERY_PARAMETER" && echo 'ERROR' || echo 'OK' +$CLICKHOUSE_CLIENT -q "SELECT Price FROM test_02428_pv1" 2>&1 | grep -q "UNKNOWN_QUERY_PARAMETER\|UNKNOWN_IDENTIFIER" && echo 'ERROR' || echo 'OK' $CLICKHOUSE_CLIENT --param_p 10 -q "SELECT Price FROM test_02428_pv1(price={p:UInt64})" $CLICKHOUSE_CLIENT --param_l 1 -q "SELECT Price FROM test_02428_pv1(price=50) LIMIT ({l:UInt64})" From 42b2fe9adcf4596e8e36231068911c5dbdc4948f Mon Sep 17 00:00:00 2001 From: kssenii Date: Tue, 21 Nov 2023 13:21:35 +0100 Subject: [PATCH 0022/1081] Fxi --- src/Common/ErrorCodes.cpp | 1 + .../ReplicatedMergeTreePartCheckThread.cpp | 10 +- src/Storages/MergeTree/checkDataPart.cpp | 17 +++- .../02916_broken_projection.reference | 93 ++++++++++--------- .../0_stateless/02916_broken_projection.sh | 39 ++++---- 5 files changed, 94 insertions(+), 66 deletions(-) diff --git a/src/Common/ErrorCodes.cpp b/src/Common/ErrorCodes.cpp index 28f8e6c6021..9c3aab5ad01 100644 --- a/src/Common/ErrorCodes.cpp +++ b/src/Common/ErrorCodes.cpp @@ -586,6 +586,7 @@ M(704, CANNOT_USE_QUERY_CACHE_WITH_NONDETERMINISTIC_FUNCTIONS) \ M(705, TABLE_NOT_EMPTY) \ M(706, LIBSSH_ERROR) \ + M(707, BROKEN_PROJECTION) \ M(999, KEEPER_EXCEPTION) \ M(1000, POCO_EXCEPTION) \ M(1001, STD_EXCEPTION) \ diff --git a/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp 
b/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp index 4468cf8e3bf..ba4d4869025 100644 --- a/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp +++ b/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp @@ -63,7 +63,7 @@ void ReplicatedMergeTreePartCheckThread::enqueuePart(const String & name, time_t if (parts_set.contains(name)) return; - LOG_TRACE(log, "Enqueueing {} for check after after {}s", name, delay_to_check_seconds); + LOG_TRACE(log, "Enqueueing {} for check after {}s", name, delay_to_check_seconds); parts_queue.emplace_back(name, std::chrono::steady_clock::now() + std::chrono::seconds(delay_to_check_seconds)); parts_set.insert(name); task->schedule(); @@ -385,17 +385,19 @@ ReplicatedCheckResult ReplicatedMergeTreePartCheckThread::checkPartImpl(const St if (isRetryableException(std::current_exception())) throw; - tryLogCurrentException(log, __PRETTY_FUNCTION__); - PreformattedMessage message; if (is_broken_projection) { - message = PreformattedMessage::create("Part {} has a broken projection. It will be ignored.", part_name); + message = PreformattedMessage::create( + "Part {} has a broken projections. It will be ignored. Broken projections info: \n{}", + part_name, getCurrentExceptionMessage(false)); LOG_DEBUG(log, message); result.action = ReplicatedCheckResult::DoNothing; } else { + tryLogCurrentException(log, __PRETTY_FUNCTION__); + message = PreformattedMessage::create("Part {} looks broken. Removing it and will try to fetch.", part_name); LOG_ERROR(log, message); result.action = ReplicatedCheckResult::TryFetchMissing; diff --git a/src/Storages/MergeTree/checkDataPart.cpp b/src/Storages/MergeTree/checkDataPart.cpp index 8feabf344b5..3bb6f763c8b 100644 --- a/src/Storages/MergeTree/checkDataPart.cpp +++ b/src/Storages/MergeTree/checkDataPart.cpp @@ -42,6 +42,7 @@ namespace ErrorCodes extern const int NO_FILE_IN_DATA_PART; extern const int NETWORK_ERROR; extern const int SOCKET_TIMEOUT; + extern const int BROKEN_PROJECTION; } @@ -272,6 +273,7 @@ static IMergeTreeDataPart::Checksums checkDataPart( } } + std::string broken_projections_message; for (const auto & [name, projection] : data_part->getProjectionParts()) { if (is_cancelled()) @@ -307,7 +309,15 @@ static IMergeTreeDataPart::Checksums checkDataPart( is_broken_projection = true; if (throw_on_broken_projection) - throw; + { + if (!broken_projections_message.empty()) + broken_projections_message += "\n"; + + broken_projections_message += fmt::format( + "Part {} has a broken projection {} (error: {})", + data_part->name, name, getCurrentExceptionMessage(false)); + continue; + } projections_on_disk.erase(projection_file); checksums_txt.remove(projection_file); @@ -320,6 +330,11 @@ static IMergeTreeDataPart::Checksums checkDataPart( projections_on_disk.erase(projection_file); } + if (throw_on_broken_projection && !broken_projections_message.empty()) + { + throw Exception(ErrorCodes::BROKEN_PROJECTION, broken_projections_message.data()); + } + if (require_checksums && !projections_on_disk.empty()) { throw Exception(ErrorCodes::UNEXPECTED_FILE_IN_DATA_PART, diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index 62966036eed..aee18a21fb8 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -7,42 +7,40 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] 
-select from projection 'proj' +select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] -select from projection 'proj_2' +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] check table 1 -0 broke metadata of part 'proj' (parent part: all_2_2_0) system.parts all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj' +select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] -select from projection 'proj_2' +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] check table 0 broken projections info all_2_2_0 proj FILE_DOESNT_EXIST check table full -all_2_2_0 0 Part all_2_2_0 has a broken projection. It will be ignored. -0 +all_2_2_0 0 Part all_2_2_0 has a broken projections. It will be ignored. Broken projections info: \nCode: 707. DB::Exception: Part all_2_2_0 has a broken projection proj (error: Code: 107. DB::ErrnoException: Cannot open file /var/lib/clickhouse/store/521/521986ec-2fef-42c8-a402-83f937689286/all_2_2_0/proj.proj/columns.txt, errno: 2, strerror: No such file or directory. (FILE_DOESNT_EXIST) (version 23.11.1.1)). 
(BROKEN_PROJECTION) (version 23.11.1.1) broke data of part 'proj_2' (parent part: all_2_2_0) broken projections info all_2_2_0 proj FILE_DOESNT_EXIST @@ -51,13 +49,12 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj' +select from projection 'proj', expect error: proj_2 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] -select from projection 'proj_2' -FILE_DOESNT_EXIST +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +select from projection 'proj_2', expect error: proj_2 check table 0 broken projections info @@ -68,19 +65,18 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj' +select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] -select from projection 'proj_2' +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] check table 0 -0 broke data of part 'proj_2' (parent part: all_3_3_0) broken projections info all_2_2_0 proj FILE_DOESNT_EXIST @@ -88,6 +84,7 @@ all_2_2_0 proj_2 NO_FILE_IN_DATA_PART insert new part insert new part optimize +OPTIMIZE TABLE test SETTINGS alter_sync=0 0 broken projections info all_2_2_0 proj FILE_DOESNT_EXIST @@ -101,19 +98,18 @@ all_3_3_0 0 ['proj','proj_2'] all_3_5_1 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] -select from projection 'proj' +select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] -select from projection 'proj_2' +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] check table 0 -0 broke metadata of part 'proj' (parent part: all_1_1_0) Detach - Attach broken projections info @@ -121,7 +117,6 @@ all_1_1_0 proj NO_FILE_IN_DATA_PART all_2_2_0 proj NO_FILE_IN_DATA_PART all_2_2_0 proj_2 FILE_DOESNT_EXIST all_3_3_0 proj_2 FILE_DOESNT_EXIST -0 broke data of part 'proj_2' (parent part: all_1_1_0) Detach - Attach broken projections info @@ -138,21 +133,21 @@ all_3_3_0 0 ['proj','proj_2'] all_3_5_1 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] -select from projection 'proj' +select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] -select from projection 'proj_2' +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] check table 0 check table full -all_2_2_0 0 Part all_2_2_0 has a broken projection. It will be ignored. -all_1_1_0 0 Part all_1_1_0 has a broken projection. It will be ignored. 
+all_2_2_0 0 Part all_2_2_0 has a broken projections. It will be ignored. Broken projections info: \nCode: 707. DB::Exception: Part all_2_2_0 has a broken projection proj (error: Code: 107. DB::ErrnoException: Cannot open file /var/lib/clickhouse/store/521/521986ec-2fef-42c8-a402-83f937689286/all_2_2_0/proj.proj/columns.txt, errno: 2, strerror: No such file or directory. (FILE_DOESNT_EXIST) (version 23.11.1.1))\nPart all_2_2_0 has a broken projection proj_2 (error: Code: 226. DB::Exception: There is no file for column \'c\' in data part \'proj_2\'. (NO_FILE_IN_DATA_PART) (version 23.11.1.1)). (BROKEN_PROJECTION) (version 23.11.1.1) +all_1_1_0 0 Part all_1_1_0 has a broken projections. It will be ignored. Broken projections info: \nCode: 707. DB::Exception: Part all_1_1_0 has a broken projection proj (error: Code: 107. DB::ErrnoException: Cannot open file /var/lib/clickhouse/store/521/521986ec-2fef-42c8-a402-83f937689286/all_1_1_0/proj.proj/columns.txt, errno: 2, strerror: No such file or directory. (FILE_DOESNT_EXIST) (version 23.11.1.1))\nPart all_1_1_0 has a broken projection proj_2 (error: Code: 226. DB::Exception: There is no file for column \'c\' in data part \'proj_2\'. (NO_FILE_IN_DATA_PART) (version 23.11.1.1)). (BROKEN_PROJECTION) (version 23.11.1.1) materialize projection proj check table full system.parts @@ -167,45 +162,55 @@ all_3_5_1 0 ['proj'] all_3_5_1_6 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] -select from projection 'proj' +select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] -select from projection 'proj_2' +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] check table 1 materialize projection proj_2 check table full +broke data of part 'proj' (parent part: all_3_5_1_7) +insert new part +optimize +OPTIMIZE TABLE test FINAL +insert new part +optimize +OPTIMIZE TABLE test FINAL system.parts all_0_0_0 0 ['proj','proj_2'] all_0_0_0_6 0 ['proj','proj_2'] -all_0_0_0_7 1 ['proj','proj_2'] +all_0_0_0_7 0 ['proj','proj_2'] +all_0_8_2_7 1 ['proj_2'] all_1_1_0 0 ['proj','proj_2'] all_1_1_0_6 0 ['proj','proj_2'] -all_1_1_0_7 1 ['proj','proj_2'] +all_1_1_0_7 0 ['proj','proj_2'] all_2_2_0 0 ['proj','proj_2'] all_2_2_0_6 0 ['proj','proj_2'] -all_2_2_0_7 1 ['proj','proj_2'] +all_2_2_0_7 0 ['proj','proj_2'] all_3_3_0 0 ['proj','proj_2'] all_3_5_1 0 ['proj'] all_3_5_1_6 0 ['proj'] -all_3_5_1_7 1 ['proj','proj_2'] +all_3_5_1_7 0 ['proj','proj_2'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] -select from projection 'proj' +all_8_8_0 0 ['proj','proj_2'] +all_9_9_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['default.test.proj'] -select from projection 'proj_2' +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj_2'] +select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['default.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] check table 1 diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 
bf0ec61fd76..bf382624787 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -24,7 +24,7 @@ CREATE TABLE test SELECT d ORDER BY c ) ) -ENGINE = ReplicatedMergeTree('/test3/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '1') PRIMARY KEY (a) +ENGINE = ReplicatedMergeTree('/test4/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '1') PRIMARY KEY (a) SETTINGS min_bytes_for_wide_part = 0, max_parts_to_merge_at_once=3, enable_vertical_merge_algorithm=1, @@ -65,18 +65,13 @@ function break_projection() LIMIT 1; ") - path=$($CLICKHOUSE_CLIENT -q "SELECT path FROM system.disks WHERE name='$disk_name'") - - # make sure path is absolute - $CLICKHOUSE_CLIENT -q "select throwIf(substring('$path', 1, 1) != '/', 'Path is relative: $path')" || exit - if [ "$break_type" = "data" ] then - rm "$path/$part_path/d.bin" - rm "$path/$part_path/c.bin" + rm "$part_path/d.bin" + rm "$part_path/c.bin" echo "broke data of part '$part_name' (parent part: $parent_name)" else - rm "$path/$part_path/columns.txt" + rm "$part_path/columns.txt" echo "broke metadata of part '$part_name' (parent part: $parent_name)" fi } @@ -115,12 +110,12 @@ function check() WHERE table='test' AND database=currentDatabase() ORDER BY name;" - echo "select from projection 'proj'" + echo "select from projection 'proj', expect error: $expect_broken_part" query_id=$(random 8) if [ "$expect_broken_part" = "proj" ] then - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12 ORDER BY c;" 2>&1 | grep -o $expected_error + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --send_logs_level 'fatal' --query_id $query_id -q "SELECT c FROM test WHERE d == 12 ORDER BY c;" 2>&1 | grep -o $expected_error else $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c;" echo 'used projections' @@ -130,12 +125,12 @@ function check() " fi - echo "select from projection 'proj_2'" + echo "select from projection 'proj_2', expect error: $expect_broken_part" query_id=$(random 8) if [ "$expect_broken_part" = "proj_2" ] then - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12 ORDER BY d;" 2>&1 | grep -o $expected_error + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --send_logs_level 'fatal' --query_id $query_id -q "SELECT d FROM test WHERE c == 12 ORDER BY d;" 2>&1 | grep -o $expected_error else $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d;" echo 'used projections' @@ -146,7 +141,9 @@ function check() fi echo 'check table' - $CLICKHOUSE_CLIENT -q "CHECK TABLE test" + $CLICKHOUSE_CLIENT -nm -q " + SET send_logs_level='fatal'; + CHECK TABLE test;" } function optimize() @@ -159,16 +156,21 @@ function optimize() if [ $final -eq 1 ]; then query="$query FINAL" + fi if [ $no_wait -eq 1 ]; then query="$query SETTINGS alter_sync=0" + fi - $CLICKHOUSE_CLIENT -nm -q $query + echo $query + + $CLICKHOUSE_CLIENT -q "$query" } function reattach() { echo 'Detach - Attach' $CLICKHOUSE_CLIENT -nm -q " + SET send_logs_level='fatal'; DETACH TABLE test; ATTACH TABLE test; " @@ -184,7 +186,10 @@ function materialize_projection function check_table_full() { echo 'check table full' - $CLICKHOUSE_CLIENT -q "CHECK TABLE test SETTINGS check_query_single_value_result = 0" | grep "broken" + $CLICKHOUSE_CLIENT -nm -q " + SET send_logs_level='fatal'; + CHECK TABLE test SETTINGS 
check_query_single_value_result = 0; +" | grep "broken" } @@ -300,5 +305,5 @@ optimize 1 0 check $CLICKHOUSE_CLIENT -nm -q " -DROP TABLE test; +DROP TABLE test SYNC; " From bcc87c01771414806fca705b5c9b5e0e925dea5f Mon Sep 17 00:00:00 2001 From: kssenii Date: Tue, 21 Nov 2023 17:17:36 +0100 Subject: [PATCH 0023/1081] Better test --- .../ReplicatedMergeTreePartCheckThread.cpp | 3 +- src/Storages/System/StorageSystemDisks.cpp | 2 +- .../02916_broken_projection.reference | 43 +++++++++---------- .../0_stateless/02916_broken_projection.sh | 27 ++++++++---- 4 files changed, 42 insertions(+), 33 deletions(-) diff --git a/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp b/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp index ba4d4869025..d058113e134 100644 --- a/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp +++ b/src/Storages/MergeTree/ReplicatedMergeTreePartCheckThread.cpp @@ -388,8 +388,9 @@ ReplicatedCheckResult ReplicatedMergeTreePartCheckThread::checkPartImpl(const St PreformattedMessage message; if (is_broken_projection) { + WriteBufferFromOwnString wb; message = PreformattedMessage::create( - "Part {} has a broken projections. It will be ignored. Broken projections info: \n{}", + "Part {} has a broken projections. It will be ignored. Broken projections info: {}", part_name, getCurrentExceptionMessage(false)); LOG_DEBUG(log, message); result.action = ReplicatedCheckResult::DoNothing; diff --git a/src/Storages/System/StorageSystemDisks.cpp b/src/Storages/System/StorageSystemDisks.cpp index 250fcdba641..23a00cc7ae5 100644 --- a/src/Storages/System/StorageSystemDisks.cpp +++ b/src/Storages/System/StorageSystemDisks.cpp @@ -63,7 +63,7 @@ Pipe StorageSystemDisks::read( for (const auto & [disk_name, disk_ptr] : context->getDisksMap()) { col_name->insert(disk_name); - col_path->insert(fs::absolute(disk_ptr->getPath()).string()); + col_path->insert(disk_ptr->getPath()); col_free->insert(disk_ptr->getAvailableSpace().value_or(std::numeric_limits::max())); col_total->insert(disk_ptr->getTotalSpace().value_or(std::numeric_limits::max())); col_unreserved->insert(disk_ptr->getUnreservedSpace().value_or(std::numeric_limits::max())); diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index aee18a21fb8..1b84ca96840 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -11,12 +11,12 @@ select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 broke metadata of part 'proj' (parent part: all_2_2_0) @@ -29,18 +29,18 @@ select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 broken projections info all_2_2_0 proj FILE_DOESNT_EXIST -check table full -all_2_2_0 0 Part 
all_2_2_0 has a broken projections. It will be ignored. Broken projections info: \nCode: 707. DB::Exception: Part all_2_2_0 has a broken projection proj (error: Code: 107. DB::ErrnoException: Cannot open file /var/lib/clickhouse/store/521/521986ec-2fef-42c8-a402-83f937689286/all_2_2_0/proj.proj/columns.txt, errno: 2, strerror: No such file or directory. (FILE_DOESNT_EXIST) (version 23.11.1.1)). (BROKEN_PROJECTION) (version 23.11.1.1) +check table full (all_2_2_0) +all_2_2_0 broke data of part 'proj_2' (parent part: all_2_2_0) broken projections info all_2_2_0 proj FILE_DOESNT_EXIST @@ -53,7 +53,7 @@ select from projection 'proj', expect error: proj_2 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj select from projection 'proj_2', expect error: proj_2 check table 0 @@ -69,12 +69,12 @@ select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 broke data of part 'proj_2' (parent part: all_3_3_0) @@ -102,12 +102,12 @@ select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 broke metadata of part 'proj' (parent part: all_1_1_0) @@ -137,19 +137,18 @@ select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 -check table full -all_2_2_0 0 Part all_2_2_0 has a broken projections. It will be ignored. Broken projections info: \nCode: 707. DB::Exception: Part all_2_2_0 has a broken projection proj (error: Code: 107. DB::ErrnoException: Cannot open file /var/lib/clickhouse/store/521/521986ec-2fef-42c8-a402-83f937689286/all_2_2_0/proj.proj/columns.txt, errno: 2, strerror: No such file or directory. (FILE_DOESNT_EXIST) (version 23.11.1.1))\nPart all_2_2_0 has a broken projection proj_2 (error: Code: 226. DB::Exception: There is no file for column \'c\' in data part \'proj_2\'. (NO_FILE_IN_DATA_PART) (version 23.11.1.1)). (BROKEN_PROJECTION) (version 23.11.1.1) -all_1_1_0 0 Part all_1_1_0 has a broken projections. It will be ignored. Broken projections info: \nCode: 707. DB::Exception: Part all_1_1_0 has a broken projection proj (error: Code: 107. DB::ErrnoException: Cannot open file /var/lib/clickhouse/store/521/521986ec-2fef-42c8-a402-83f937689286/all_1_1_0/proj.proj/columns.txt, errno: 2, strerror: No such file or directory. (FILE_DOESNT_EXIST) (version 23.11.1.1))\nPart all_1_1_0 has a broken projection proj_2 (error: Code: 226. 
DB::Exception: There is no file for column \'c\' in data part \'proj_2\'. (NO_FILE_IN_DATA_PART) (version 23.11.1.1)). (BROKEN_PROJECTION) (version 23.11.1.1) +check table full (all_1_1_0) +all_1_1_0 materialize projection proj -check table full +check table full () system.parts all_0_0_0 0 ['proj','proj_2'] all_0_0_0_6 1 ['proj','proj_2'] @@ -166,16 +165,16 @@ select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 materialize projection proj_2 -check table full +check table full () broke data of part 'proj' (parent part: all_3_5_1_7) insert new part optimize @@ -206,11 +205,11 @@ select from projection 'proj', expect error: 12 16 used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; ['test.test.proj_2'] +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj_2 select from projection 'proj_2', expect error: 12 16 used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; ['test.test.proj_2'] +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index bf382624787..a522de42c89 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -121,7 +121,7 @@ function check() echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " SYSTEM FLUSH LOGS; - SELECT query, projections FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' + SELECT query, splitByChar('.', arrayJoin(projections))[-1] FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' " fi @@ -136,7 +136,7 @@ function check() echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " SYSTEM FLUSH LOGS; - SELECT query, projections FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' + SELECT query, splitByChar('.', arrayJoin(projections))[-1] FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' " fi @@ -185,11 +185,20 @@ function materialize_projection function check_table_full() { - echo 'check table full' - $CLICKHOUSE_CLIENT -nm -q " - SET send_logs_level='fatal'; - CHECK TABLE test SETTINGS check_query_single_value_result = 0; -" | grep "broken" + echo "check table full ($1)" + expect_broken_part=$1 + if [ "$expect_broken_part" = "" ] + then + $CLICKHOUSE_CLIENT -nm -q " + SET send_logs_level='fatal'; + CHECK TABLE test SETTINGS check_query_single_value_result = 0; + " | grep "broken" + else + $CLICKHOUSE_CLIENT -nm -q " + SET send_logs_level='fatal'; + CHECK TABLE test SETTINGS check_query_single_value_result = 0; + " | grep "broken" | grep -o $expect_broken_part | head -n 1 + fi } @@ -216,7 +225,7 @@ check broken_projections_info # Check table query will also show a list of parts which have broken projections. 
-check_table_full +check_table_full "all_2_2_0" # Break data file of projection 'proj_2' for part all_2_2_0 break_projection proj_2 all_2_2_0 data @@ -280,7 +289,7 @@ broken_projections_info check -check_table_full +check_table_full all_1_1_0 materialize_projection proj From e8d99cb29654645c5a89d6cb15856b48a55d7bdf Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Wed, 22 Nov 2023 12:34:31 +0100 Subject: [PATCH 0024/1081] Fix style check --- tests/queries/0_stateless/02916_broken_projection.sh | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index a522de42c89..6ed92e2e06e 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -54,8 +54,8 @@ function break_projection() parent_name=$2 break_type=$3 - read -r disk_name part_path <<< $($CLICKHOUSE_CLIENT -nm -q " - SELECT disk_name, path + read -r part_path <<< $($CLICKHOUSE_CLIENT -nm -q " + SELECT path FROM system.projection_parts WHERE table='test' AND database=currentDatabase() From a57e612cf2ef657801cdeefb8410caf5cab804a2 Mon Sep 17 00:00:00 2001 From: kssenii Date: Fri, 24 Nov 2023 16:08:49 +0100 Subject: [PATCH 0025/1081] Fxi tests --- src/Storages/StorageMergeTree.cpp | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/Storages/StorageMergeTree.cpp b/src/Storages/StorageMergeTree.cpp index 74277616e95..84b48bb650b 100644 --- a/src/Storages/StorageMergeTree.cpp +++ b/src/Storages/StorageMergeTree.cpp @@ -2247,7 +2247,7 @@ std::optional StorageMergeTree::checkDataNext(DataValidationTasksPt { try { - auto calculated_checksums = checkDataPart(part, false, noop, /* is_cancelled */{}, /* throw_on_broken_projection */true); + auto calculated_checksums = checkDataPart(part, false, noop, /* is_cancelled */[]{ return false; }, /* throw_on_broken_projection */true); calculated_checksums.checkEqual(part->checksums, true); auto & part_mutable = const_cast(*part); @@ -2268,7 +2268,7 @@ std::optional StorageMergeTree::checkDataNext(DataValidationTasksPt { try { - checkDataPart(part, true, noop, /* is_cancelled */{}, /* throw_on_broken_projection */true); + checkDataPart(part, true, noop, /* is_cancelled */[]{ return false; }, /* throw_on_broken_projection */true); return CheckResult(part->name, true, ""); } catch (...) 
From 8ebbc8d85dc3f1e37d109ddb1ad1a05a55283a79 Mon Sep 17 00:00:00 2001 From: kssenii Date: Fri, 24 Nov 2023 18:37:40 +0100 Subject: [PATCH 0026/1081] Update 02117_show_create_table_system.reference --- .../0_stateless/02117_show_create_table_system.reference | 3 +++ 1 file changed, 3 insertions(+) diff --git a/tests/queries/0_stateless/02117_show_create_table_system.reference b/tests/queries/0_stateless/02117_show_create_table_system.reference index 9ed905a0df8..e122de8ef6c 100644 --- a/tests/queries/0_stateless/02117_show_create_table_system.reference +++ b/tests/queries/0_stateless/02117_show_create_table_system.reference @@ -685,6 +685,9 @@ CREATE TABLE system.projection_parts `rows_where_ttl_info.expression` Array(String), `rows_where_ttl_info.min` Array(DateTime), `rows_where_ttl_info.max` Array(DateTime), + `is_broken` UInt8, + `exception_code` Int32, + `exception` String, `bytes` UInt64 ALIAS bytes_on_disk, `marks_size` UInt64 ALIAS marks_bytes, `part_name` String ALIAS name From b4dab194954845b76d1ce9a6bf8b18dded059d74 Mon Sep 17 00:00:00 2001 From: kssenii Date: Mon, 27 Nov 2023 12:42:09 +0100 Subject: [PATCH 0027/1081] Fix test --- .../0_stateless/02916_broken_projection.reference | 1 + tests/queries/0_stateless/02916_broken_projection.sh | 12 +++++++++--- 2 files changed, 10 insertions(+), 3 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index 1b84ca96840..1f072e207a7 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -55,6 +55,7 @@ select from projection 'proj', expect error: proj_2 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj select from projection 'proj_2', expect error: proj_2 +FILE_DOESNT_EXIST check table 0 broken projections info diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 6ed92e2e06e..80805330577 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -115,7 +115,10 @@ function check() if [ "$expect_broken_part" = "proj" ] then - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --send_logs_level 'fatal' --query_id $query_id -q "SELECT c FROM test WHERE d == 12 ORDER BY c;" 2>&1 | grep -o $expected_error + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -nm -q " +SET send_logs_level='fatal'; +SELECT c FROM test WHERE d == 12 ORDER BY c; +" 2>&1 | grep -oF "$expected_error" else $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c;" echo 'used projections' @@ -130,7 +133,10 @@ function check() if [ "$expect_broken_part" = "proj_2" ] then - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --send_logs_level 'fatal' --query_id $query_id -q "SELECT d FROM test WHERE c == 12 ORDER BY d;" 2>&1 | grep -o $expected_error + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -nm -q " +SET send_logs_level='fatal'; +SELECT d FROM test WHERE c == 12 ORDER BY d; +" 2>&1 | grep -oF "$expected_error" else $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d;" echo 'used projections' @@ -234,7 +240,7 @@ break_projection proj_2 all_2_2_0 data broken_projections_info # Select now fails with error "File doesn't exist" -check "proj_2" 
"FILE_DOESNT_EXIST" +check "proj_2" FILE_DOESNT_EXIST # Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info. broken_projections_info From a6972e7c90fd8ff775855cac13f47f9cd46b2da1 Mon Sep 17 00:00:00 2001 From: kssenii Date: Tue, 28 Nov 2023 10:22:10 +0100 Subject: [PATCH 0028/1081] Fxi --- src/Storages/MergeTree/IMergeTreeDataPart.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index 85ce112d9a1..be665a64f1c 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -1145,7 +1145,7 @@ void IMergeTreeDataPart::loadChecksums(bool require) LOG_WARNING(storage.log, "Checksums for part {} not found. Will calculate them from data on disk.", name); bool noop; - checksums = checkDataPart(shared_from_this(), false, noop, /* is_cancelled */{}, /* throw_on_broken_projection */false); + checksums = checkDataPart(shared_from_this(), false, noop, /* is_cancelled */[]{ return false; }, /* throw_on_broken_projection */false); writeChecksums(checksums, {}); bytes_on_disk = checksums.getTotalSizeOnDisk(); From 0e11eeaea546dd41231a4f180b877ada1291a23d Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 30 Nov 2023 13:52:08 +0100 Subject: [PATCH 0029/1081] Allow to backup and restore parts with broken projections --- src/Backups/BackupSettings.cpp | 2 + src/Backups/BackupSettings.h | 6 + .../MergeTree/DataPartStorageOnDiskBase.cpp | 35 +- .../MergeTree/DataPartStorageOnDiskBase.h | 4 +- src/Storages/MergeTree/IDataPartStorage.h | 4 +- src/Storages/MergeTree/IMergeTreeDataPart.cpp | 15 +- src/Storages/MergeTree/IMergeTreeDataPart.h | 3 +- src/Storages/MergeTree/MergeTreeData.cpp | 9 +- .../02916_broken_projection.reference | 226 +++++++++- .../0_stateless/02916_broken_projection.sh | 426 +++++++++++++----- 10 files changed, 588 insertions(+), 142 deletions(-) diff --git a/src/Backups/BackupSettings.cpp b/src/Backups/BackupSettings.cpp index 68d825e9468..51d713f03e1 100644 --- a/src/Backups/BackupSettings.cpp +++ b/src/Backups/BackupSettings.cpp @@ -32,6 +32,8 @@ namespace ErrorCodes M(UInt64, shard_num) \ M(UInt64, replica_num) \ M(Bool, check_parts) \ + M(Bool, check_projection_parts) \ + M(Bool, allow_backup_broken_projections) \ M(Bool, internal) \ M(String, host_id) \ M(OptionalUUID, backup_uuid) diff --git a/src/Backups/BackupSettings.h b/src/Backups/BackupSettings.h index f26b992b348..ec430905f51 100644 --- a/src/Backups/BackupSettings.h +++ b/src/Backups/BackupSettings.h @@ -62,6 +62,12 @@ struct BackupSettings /// Check checksums of the data parts before writing them to a backup. bool check_parts = true; + /// Check checksums of the projection data parts before writing them to a backup. + bool check_projection_parts = true; + + /// Allow to create backup with broken projections. + bool allow_backup_broken_projections = false; + /// Internal, should not be specified by user. /// Whether this backup is a part of a distributed backup created by BACKUP ON CLUSTER. 
bool internal = false; diff --git a/src/Storages/MergeTree/DataPartStorageOnDiskBase.cpp b/src/Storages/MergeTree/DataPartStorageOnDiskBase.cpp index 7fc8187aee5..6e5cbdde355 100644 --- a/src/Storages/MergeTree/DataPartStorageOnDiskBase.cpp +++ b/src/Storages/MergeTree/DataPartStorageOnDiskBase.cpp @@ -334,7 +334,9 @@ void DataPartStorageOnDiskBase::backup( const ReadSettings & read_settings, bool make_temporary_hard_links, BackupEntries & backup_entries, - TemporaryFilesOnDisks * temp_dirs) const + TemporaryFilesOnDisks * temp_dirs, + bool is_projection_part, + bool allow_backup_broken_projection) const { fs::path part_path_on_disk = fs::path{root_path} / part_dir; fs::path part_path_in_backup = fs::path{path_in_backup} / part_dir; @@ -376,7 +378,7 @@ void DataPartStorageOnDiskBase::backup( bool copy_encrypted = !backup_settings.decrypt_files_from_encrypted_disks; - for (const auto & filepath : files_to_backup) + auto backup_file = [&](const String & filepath) { auto filepath_on_disk = part_path_on_disk / filepath; auto filepath_in_backup = part_path_in_backup / filepath; @@ -384,8 +386,10 @@ void DataPartStorageOnDiskBase::backup( if (files_without_checksums.contains(filepath)) { backup_entries.emplace_back(filepath_in_backup, std::make_unique(disk, filepath_on_disk, read_settings, copy_encrypted)); - continue; + return; } + else if (is_projection_part && allow_backup_broken_projection && !disk->exists(filepath_on_disk)) + return; if (make_temporary_hard_links) { @@ -410,6 +414,31 @@ void DataPartStorageOnDiskBase::backup( backup_entry = wrapBackupEntryWith(std::move(backup_entry), temp_dir_owner); backup_entries.emplace_back(filepath_in_backup, std::move(backup_entry)); + }; + + auto * log = &Poco::Logger::get("DataPartStorageOnDiskBase::backup"); + + for (const auto & filepath : files_to_backup) + { + if (is_projection_part && allow_backup_broken_projection) + { + try + { + backup_file(filepath); + } + catch (Exception & e) + { + if (e.code() != ErrorCodes::FILE_DOESNT_EXIST) + throw; + + LOG_ERROR(log, "Cannot backup file {} of projection part {}. Will try to ignore it", filepath, part_dir); + continue; + } + } + else + { + backup_file(filepath); + } } } diff --git a/src/Storages/MergeTree/DataPartStorageOnDiskBase.h b/src/Storages/MergeTree/DataPartStorageOnDiskBase.h index 1826e84c28d..6176a13c27b 100644 --- a/src/Storages/MergeTree/DataPartStorageOnDiskBase.h +++ b/src/Storages/MergeTree/DataPartStorageOnDiskBase.h @@ -58,7 +58,9 @@ public: const ReadSettings & read_settings, bool make_temporary_hard_links, BackupEntries & backup_entries, - TemporaryFilesOnDisks * temp_dirs) const override; + TemporaryFilesOnDisks * temp_dirs, + bool is_projection_part, + bool allow_backup_broken_projection) const override; MutableDataPartStoragePtr freeze( const std::string & to, diff --git a/src/Storages/MergeTree/IDataPartStorage.h b/src/Storages/MergeTree/IDataPartStorage.h index 072cb29626e..b3a6ab203d5 100644 --- a/src/Storages/MergeTree/IDataPartStorage.h +++ b/src/Storages/MergeTree/IDataPartStorage.h @@ -222,7 +222,9 @@ public: const ReadSettings & read_settings, bool make_temporary_hard_links, BackupEntries & backup_entries, - TemporaryFilesOnDisks * temp_dirs) const = 0; + TemporaryFilesOnDisks * temp_dirs, + bool is_projection_part, + bool allow_backup_broken_projection) const = 0; /// Creates hardlinks into 'to/dir_path' for every file in data part. /// Callback is called after hardlinks are created, but before 'delete-on-destroy.txt' marker is removed. 
diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index be665a64f1c..940b3991067 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -647,13 +647,14 @@ void IMergeTreeDataPart::loadColumnsChecksumsIndexes(bool require_columns_checks loadIndex(); /// Must be called after loadIndexGranularity as it uses the value of `index_granularity` loadRowsCount(); /// Must be called after loadIndexGranularity() as it uses the value of `index_granularity`. loadPartitionAndMinMaxIndex(); + bool has_broken_projections = false; if (!parent_part) { loadTTLInfos(); - loadProjections(require_columns_checksums, check_consistency, false /* if_not_loaded */); + has_broken_projections = !loadProjections(require_columns_checksums, check_consistency, false /* if_not_loaded */); } - if (check_consistency) + if (check_consistency && !has_broken_projections) checkConsistency(require_columns_checksums); loadDefaultCompressionCodec(); @@ -715,9 +716,10 @@ void IMergeTreeDataPart::addProjectionPart( projection_parts[projection_name] = std::move(projection_part); } -void IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool check_consistency, bool if_not_loaded) +bool IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool check_consistency, bool if_not_loaded) { auto metadata_snapshot = storage.getInMemoryMetadataPtr(); + bool has_broken_projection = false; for (const auto & projection : metadata_snapshot->projections) { auto path = projection.name + ".proj"; @@ -742,16 +744,19 @@ void IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool ch if (isRetryableException(std::current_exception())) throw; + auto message = getCurrentExceptionMessage(true); LOG_ERROR(&Poco::Logger::get("IMergeTreeDataPart"), - "Cannot load projection {}, will consider it broken", projection.name); + "Cannot load projection {}, will consider it broken. Reason: {}", projection.name, message); - part->setBrokenReason(getCurrentExceptionMessage(false), getCurrentExceptionCode()); + has_broken_projection = true; + part->setBrokenReason(message, getCurrentExceptionCode()); } addProjectionPart(projection.name, std::move(part)); } } } + return has_broken_projection; } void IMergeTreeDataPart::loadIndexGranularity() diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.h b/src/Storages/MergeTree/IMergeTreeDataPart.h index 9af2c16f1e8..6e276284f4c 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.h +++ b/src/Storages/MergeTree/IMergeTreeDataPart.h @@ -421,7 +421,8 @@ public: bool hasBrokenProjection(const String & projection_name) const; - void loadProjections(bool require_columns_checksums, bool check_consistency, bool if_not_loaded = false); + /// Return true, if all projections were loaded successfully and none was marked as broken. 
+ bool loadProjections(bool require_columns_checksums, bool check_consistency, bool if_not_loaded = false); void setBrokenReason(const String & message, int code) const; diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index 8683e4293e9..c95aee88aee 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -5113,7 +5113,7 @@ MergeTreeData::PartsBackupEntries MergeTreeData::backupParts( if (hold_table_lock && !table_lock) table_lock = lockForShare(local_context->getCurrentQueryId(), local_context->getSettingsRef().lock_acquire_timeout); - if (backup_settings.check_parts) + if (backup_settings.check_projection_parts) part->checkConsistencyWithProjections(/* require_part_metadata= */ true); BackupEntries backup_entries_from_part; @@ -5125,7 +5125,8 @@ MergeTreeData::PartsBackupEntries MergeTreeData::backupParts( read_settings, make_temporary_hard_links, backup_entries_from_part, - &temp_dirs); + &temp_dirs, + false, false); auto projection_parts = part->getProjectionParts(); for (const auto & [projection_name, projection_part] : projection_parts) @@ -5138,7 +5139,9 @@ MergeTreeData::PartsBackupEntries MergeTreeData::backupParts( read_settings, make_temporary_hard_links, backup_entries_from_part, - &temp_dirs); + &temp_dirs, + projection_part->is_broken, + backup_settings.allow_backup_broken_projections); } if (hold_storage_and_part_ptrs) diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index 1f072e207a7..4c4901ae99f 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -19,6 +19,7 @@ used projections SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 +0 broke metadata of part 'proj' (parent part: all_2_2_0) system.parts all_0_0_0 1 ['proj','proj_2'] @@ -39,8 +40,9 @@ check table 0 broken projections info all_2_2_0 proj FILE_DOESNT_EXIST -check table full (all_2_2_0) +check table full (test - all_2_2_0) all_2_2_0 +0 broke data of part 'proj_2' (parent part: all_2_2_0) broken projections info all_2_2_0 proj FILE_DOESNT_EXIST @@ -78,6 +80,7 @@ used projections SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 +0 broke data of part 'proj_2' (parent part: all_3_3_0) broken projections info all_2_2_0 proj FILE_DOESNT_EXIST @@ -111,6 +114,7 @@ used projections SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 +0 broke metadata of part 'proj' (parent part: all_1_1_0) Detach - Attach broken projections info @@ -118,6 +122,7 @@ all_1_1_0 proj NO_FILE_IN_DATA_PART all_2_2_0 proj NO_FILE_IN_DATA_PART all_2_2_0 proj_2 FILE_DOESNT_EXIST all_3_3_0 proj_2 FILE_DOESNT_EXIST +0 broke data of part 'proj_2' (parent part: all_1_1_0) Detach - Attach broken projections info @@ -146,10 +151,10 @@ used projections SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 -check table full (all_1_1_0) +check table full (test - all_1_1_0) all_1_1_0 materialize projection proj -check table full () +check table full (test - ) system.parts all_0_0_0 0 ['proj','proj_2'] all_0_0_0_6 1 ['proj','proj_2'] @@ -175,7 +180,8 @@ SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 materialize projection proj_2 -check table full () +check table full (test - ) +0 broke data of part 'proj' (parent part: all_3_5_1_7) insert new part optimize @@ -214,3 
+220,215 @@ used projections SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 +insert new part +insert new part +insert new part +insert new part +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: +used projections +SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2', expect error: +used projections +SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +1 +system.parts +all_1_1_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: +used projections +SELECT c FROM test2_replica WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2', expect error: +used projections +SELECT d FROM test2_replica WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +1 +0 +broke data of part 'proj' (parent part: all_0_0_0) +check table full (test2 - all_0_0_0) +all_0_0_0 +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: +used projections +SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2', expect error: +used projections +SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +0 +broke data of part 'all_0_0_0' +check table full (test2 - all_0_0_0) +all_0_0_0 +system.parts +all_0_0_0 0 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: +used projections +SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2', expect error: +used projections +SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +1 +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: +used projections +SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2', expect error: +used projections +SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +1 +insert new part +insert new part +insert new part +insert new part +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: +12 +16 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2', expect error: +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +1 +0 +broke data of part 'proj' (parent part: all_2_2_0) +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: proj +FILE_DOESNT_EXIST +select from projection 'proj_2', expect error: proj +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +0 +broken projections info +all_2_2_0 proj NO_FILE_IN_DATA_PART +BACKUP_CREATED +RESTORED +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: proj +FILE_DOESNT_EXIST +select from projection 'proj_2', expect error: proj +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +0 +broken projections info +all_2_2_0 proj NO_FILE_IN_DATA_PART +0 +broke all data of part 
'proj' (parent part: all_2_2_0) +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: proj +select from projection 'proj_2', expect error: proj +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +0 +broken projections info +all_2_2_0 proj NO_FILE_IN_DATA_PART +FILE_DOESNT_EXIST +materialize projection proj +system.parts +all_0_0_0 0 ['proj','proj_2'] +all_0_0_0_4 1 ['proj','proj_2'] +all_1_1_0 0 ['proj','proj_2'] +all_1_1_0_4 1 ['proj','proj_2'] +all_2_2_0 0 ['proj','proj_2'] +all_2_2_0_4 1 ['proj','proj_2'] +all_3_3_0 0 ['proj','proj_2'] +all_3_3_0_4 1 ['proj','proj_2'] +select from projection 'proj', expect error: proj +select from projection 'proj_2', expect error: proj +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +1 +broken projections info +all_2_2_0 proj NO_FILE_IN_DATA_PART +BACKUP_CREATED +RESTORED +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: proj +select from projection 'proj_2', expect error: proj +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +1 +0 +broke all data of part 'proj' (parent part: all_2_2_0) +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj','proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: proj +select from projection 'proj_2', expect error: proj +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +0 +broken projections info +all_2_2_0 proj FILE_DOESNT_EXIST +BACKUP_CREATED +RESTORED +system.parts +all_0_0_0 1 ['proj','proj_2'] +all_1_1_0 1 ['proj','proj_2'] +all_2_2_0 1 ['proj_2'] +all_3_3_0 1 ['proj','proj_2'] +select from projection 'proj', expect error: +12 +16 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2', expect error: +12 +16 +used projections +SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 +check table +0 +broken projections info diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 80805330577..1555139e16f 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -5,35 +5,40 @@ CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # shellcheck source=../shell_config.sh . 
"$CURDIR"/../shell_config.sh -$CLICKHOUSE_CLIENT -nm -q " -DROP TABLE IF EXISTS test SYNC; -CREATE TABLE test -( - a String, - b String, - c Int32, - d Int32, - e Int32, +function create_table() +{ + test_id=$1 + name=$2 + replica=$3 + $CLICKHOUSE_CLIENT -nm -q " + DROP TABLE IF EXISTS $name SYNC; + CREATE TABLE $name + ( + a String, + b String, + c Int64, + d Int64, + e Int64, - PROJECTION proj - ( - SELECT c ORDER BY d - ), - PROJECTION proj_2 - ( - SELECT d ORDER BY c + PROJECTION proj + ( + SELECT c ORDER BY d + ), + PROJECTION proj_2 + ( + SELECT d ORDER BY c + ) ) -) -ENGINE = ReplicatedMergeTree('/test4/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '1') PRIMARY KEY (a) -SETTINGS min_bytes_for_wide_part = 0, - max_parts_to_merge_at_once=3, - enable_vertical_merge_algorithm=1, - vertical_merge_algorithm_min_rows_to_activate = 1, - vertical_merge_algorithm_min_columns_to_activate = 1, - vertical_merge_algorithm_min_columns_to_activate = 1; -" - -table_uuid=$($CLICKHOUSE_CLIENT -q "SELECT uuid FROM system.tables WHERE table='test' and database=currentDatabase()") + ENGINE = ReplicatedMergeTree('/test_broken_projection_24_$test_id/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '$replica') ORDER BY a + SETTINGS min_bytes_for_wide_part = 0, + max_parts_to_merge_at_once=3, + enable_vertical_merge_algorithm=1, + vertical_merge_algorithm_min_rows_to_activate = 1, + vertical_merge_algorithm_min_columns_to_activate = 1, + vertical_merge_algorithm_min_columns_to_activate = 1, + compress_primary_key=0; + " +} function random() { @@ -42,49 +47,88 @@ function random() function insert() { - offset=$1 - size=$2 + table=$1 + offset=$2 + size=$3 echo 'insert new part' - $CLICKHOUSE_CLIENT -q "INSERT INTO test SELECT number, number, number, number, number%2 FROM numbers($offset, $size);" + $CLICKHOUSE_CLIENT -q "INSERT INTO $table SELECT number, number, number, number, number%2 FROM numbers($offset, $size);" } function break_projection() { - part_name=$1 - parent_name=$2 - break_type=$3 + table=$1 + part_name=$2 + parent_name=$3 + break_type=$4 read -r part_path <<< $($CLICKHOUSE_CLIENT -nm -q " SELECT path FROM system.projection_parts - WHERE table='test' + WHERE table='$table' AND database=currentDatabase() AND active=1 AND part_name='$part_name' AND parent_name='$parent_name' + ORDER BY modification_time DESC LIMIT 1; ") + $CLICKHOUSE_CLIENT -q "select throwIf(substring('$part_path', 1, 1) != '/', 'Path is relative: $part_path')" || exit + if [ "$break_type" = "data" ] then rm "$part_path/d.bin" rm "$part_path/c.bin" echo "broke data of part '$part_name' (parent part: $parent_name)" - else + fi + if [ "$break_type" = "metadata" ] + then rm "$part_path/columns.txt" echo "broke metadata of part '$part_name' (parent part: $parent_name)" fi + if [ "$break_type" = "part" ] + then + rm -r "$part_path" + echo "broke all data of part '$part_name' (parent part: $parent_name)" + fi +} + +function break_part() +{ + table=$1 + part_name=$2 + + read -r part_path <<< $($CLICKHOUSE_CLIENT -nm -q " + SELECT path + FROM system.parts + WHERE table='$table' + AND database=currentDatabase() + AND active=1 + AND part_name='$part_name' + ORDER BY modification_time DESC + LIMIT 1; + ") + + if [ "$part_path" = "" ] + then + echo "Part path is empty" + exit + fi + + rm $part_path/columns.txt + echo "broke data of part '$part_name'" } function broken_projections_info() { + table=$1 echo 'broken projections info' $CLICKHOUSE_CLIENT -q " SELECT parent_name, name, errors.name FROM ( SELECT parent_name, name, exception_code FROM 
system.projection_parts - WHERE table='test' + WHERE table='$table' AND database=currentDatabase() AND is_broken = 1 ) AS parts_info @@ -96,18 +140,19 @@ function broken_projections_info() function check() { + table=$1 expect_broken_part="" expected_error="" - if [ $# -ne 0 ]; then - expect_broken_part=$1 - expected_error=$2 + if [ $# -gt 1 ]; then + expect_broken_part=$2 + expected_error=$3 fi echo 'system.parts' $CLICKHOUSE_CLIENT -q " SELECT name, active, projections FROM system.parts - WHERE table='test' AND database=currentDatabase() + WHERE table='$table' AND database=currentDatabase() ORDER BY name;" echo "select from projection 'proj', expect error: $expect_broken_part" @@ -117,10 +162,10 @@ function check() then $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -nm -q " SET send_logs_level='fatal'; -SELECT c FROM test WHERE d == 12 ORDER BY c; +SELECT c FROM $table WHERE d == 12 ORDER BY c; " 2>&1 | grep -oF "$expected_error" else - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c;" + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM $table WHERE d == 12 OR d == 16 ORDER BY c;" echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " SYSTEM FLUSH LOGS; @@ -135,10 +180,10 @@ SELECT c FROM test WHERE d == 12 ORDER BY c; then $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -nm -q " SET send_logs_level='fatal'; -SELECT d FROM test WHERE c == 12 ORDER BY d; +SELECT d FROM $table WHERE c == 12 ORDER BY d; " 2>&1 | grep -oF "$expected_error" else - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d;" + $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM $table WHERE c == 12 OR c == 16 ORDER BY d;" echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " SYSTEM FLUSH LOGS; @@ -149,7 +194,7 @@ SELECT d FROM test WHERE c == 12 ORDER BY d; echo 'check table' $CLICKHOUSE_CLIENT -nm -q " SET send_logs_level='fatal'; - CHECK TABLE test;" + CHECK TABLE $table;" } function optimize() @@ -184,141 +229,274 @@ function reattach() function materialize_projection { - projection=$1 + table=$1 + projection=$2 echo "materialize projection $projection" - $CLICKHOUSE_CLIENT -q "ALTER TABLE test MATERIALIZE PROJECTION $projection SETTINGS mutations_sync=2" + $CLICKHOUSE_CLIENT -q "ALTER TABLE $table MATERIALIZE PROJECTION $projection SETTINGS mutations_sync=2" } function check_table_full() { - echo "check table full ($1)" - expect_broken_part=$1 + table=$1 + expect_broken_part=$2 + echo "check table full ($1 - $2)" if [ "$expect_broken_part" = "" ] then $CLICKHOUSE_CLIENT -nm -q " SET send_logs_level='fatal'; - CHECK TABLE test SETTINGS check_query_single_value_result = 0; + CHECK TABLE $table SETTINGS check_query_single_value_result = 0; " | grep "broken" else $CLICKHOUSE_CLIENT -nm -q " SET send_logs_level='fatal'; - CHECK TABLE test SETTINGS check_query_single_value_result = 0; + CHECK TABLE $table SETTINGS check_query_single_value_result = 0; " | grep "broken" | grep -o $expect_broken_part | head -n 1 fi } +function test1() +{ + create_table test1 test 1 -insert 0 5 + table_uuid=$($CLICKHOUSE_CLIENT -q "SELECT uuid FROM system.tables WHERE table='test' and database=currentDatabase()") -insert 5 5 + insert test 0 5 -insert 10 5 + insert test 5 5 -insert 15 5 + insert test 10 5 -check + insert test 15 5 -# Break metadata file of projection 'proj' 
-break_projection proj all_2_2_0 metadata + check test -# Do select and after "check table" query. -# Select works because it does not read columns.txt. -check + # Break metadata file of projection 'proj' + break_projection test proj all_2_2_0 metadata -# Projection 'proj' from part all_2_2_0 will now appear in broken parts info -# because it was marked broken during "check table" query. -# TODO: try to mark it during select as well -broken_projections_info + # Do select and after "check table" query. + # Select works because it does not read columns.txt. + check test -# Check table query will also show a list of parts which have broken projections. -check_table_full "all_2_2_0" + # Projection 'proj' from part all_2_2_0 will now appear in broken parts info + # because it was marked broken during "check table" query. + # TODO: try to mark it during select as well + broken_projections_info test -# Break data file of projection 'proj_2' for part all_2_2_0 -break_projection proj_2 all_2_2_0 data + # Check table query will also show a list of parts which have broken projections. + check_table_full test "all_2_2_0" -# It will not yet appear in broken projections info. -broken_projections_info + # Break data file of projection 'proj_2' for part all_2_2_0 + break_projection test proj_2 all_2_2_0 data -# Select now fails with error "File doesn't exist" -check "proj_2" FILE_DOESNT_EXIST + # It will not yet appear in broken projections info. + broken_projections_info test -# Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info. -broken_projections_info + # Select now fails with error "File doesn't exist" + check test "proj_2" FILE_DOESNT_EXIST -# Second select works, because projection is now marked as broken. -check + # Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info. + broken_projections_info test -# Break data file of projection 'proj_2' for part all_3_3_0 -break_projection proj_2 all_3_3_0 data + # Second select works, because projection is now marked as broken. + check test -# It will not yet appear in broken projections info. -broken_projections_info + # Break data file of projection 'proj_2' for part all_3_3_0 + break_projection test proj_2 all_3_3_0 data -insert 20 5 + # It will not yet appear in broken projections info. + broken_projections_info test -insert 25 5 + insert test 20 5 -# Part all_3_3_0 has 'proj' and 'proj_2' projections, but 'proj_2' is broken and server does NOT know it yet. -# Parts all_4_4_0 and all_5_5_0 have both non-broken projections. -# So a merge will be create for future part all_3_5_1. -# During merge it will fail to read from 'proj_2' of part all_3_3_0 and proj_2 will be marked broken. -# Merge will be retried and on second attempt it will succeed. -# The result part all_3_5_1 will have only 1 projection - 'proj', because -# it will skip 'proj_2' as it will see that one part does not have it anymore in the set of valid projections. -optimize 0 1 -sleep 2 + insert test 25 5 -$CLICKHOUSE_CLIENT -nm -q " -SYSTEM FLUSH LOGS; -SELECT count() FROM system.text_log -WHERE level='Error' -AND logger_name='MergeTreeBackgroundExecutor' -AND message like 'Exception while executing background task {$table_uuid:all_3_5_1}%Cannot open file%proj_2.proj/c.bin%' -" + # Part all_3_3_0 has 'proj' and 'proj_2' projections, but 'proj_2' is broken and server does NOT know it yet. + # Parts all_4_4_0 and all_5_5_0 have both non-broken projections. + # So a merge will be create for future part all_3_5_1. 
+ # During merge it will fail to read from 'proj_2' of part all_3_3_0 and proj_2 will be marked broken. + # Merge will be retried and on second attempt it will succeed. + # The result part all_3_5_1 will have only 1 projection - 'proj', because + # it will skip 'proj_2' as it will see that one part does not have it anymore in the set of valid projections. + optimize 0 1 + sleep 2 -# Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info. -broken_projections_info + $CLICKHOUSE_CLIENT -nm -q " + SYSTEM FLUSH LOGS; + SELECT count() FROM system.text_log + WHERE level='Error' + AND logger_name='MergeTreeBackgroundExecutor' + AND message like 'Exception while executing background task {$table_uuid:all_3_5_1}%Cannot open file%proj_2.proj/c.bin%' + " -check + # Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info. + broken_projections_info test -break_projection proj all_1_1_0 metadata + check test -reattach + break_projection test proj all_1_1_0 metadata -broken_projections_info + reattach -break_projection proj_2 all_1_1_0 data + broken_projections_info test -reattach + break_projection test proj_2 all_1_1_0 data -broken_projections_info + reattach -check + broken_projections_info test -check_table_full all_1_1_0 + check test -materialize_projection proj + check_table_full test all_1_1_0 -check_table_full + materialize_projection test proj -check + check_table_full test -materialize_projection proj_2 + check test -check_table_full + materialize_projection test proj_2 -break_projection proj all_3_5_1_7 data + check_table_full test -insert 30 5 + break_projection test proj all_3_5_1_7 data -optimize 1 0 + insert test 30 5 -insert 35 5 + optimize 1 0 -optimize 1 0 + insert test 35 5 -check + optimize 1 0 -$CLICKHOUSE_CLIENT -nm -q " -DROP TABLE test SYNC; -" + check test +} + +function test2() +{ + create_table test2 test2 1 + + insert test2 0 5 + + insert test2 5 5 + + insert test 10 5 + + insert test 15 5 + + check test2 + + create_table test2 test2_replica 2 + + check test2_replica + + break_projection test2 proj all_0_0_0 data + + check_table_full test2 all_0_0_0 + + check test2 + + break_part test2 all_0_0_0 + + check_table_full test2 all_0_0_0 + + check test2 + + $CLICKHOUSE_CLIENT -q "SYSTEM SYNC REPLICA test2;" + + check test2 +} + +CLICKHOUSE_TEST_UNIQUE_NAME="gghhhhhhhhhhhhhhhhhhh" +function test3() +{ + create_table test3 test 1 + + insert test 0 5 + + insert test 5 5 + + insert test 10 5 + + insert test 15 5 + + check test + + break_projection test proj all_2_2_0 data + + check test proj FILE_DOESNT_EXIST + + broken_projections_info test + + ${CLICKHOUSE_CLIENT} -nm --query " + backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}') settings check_projection_parts=false; + " | grep -o "BACKUP_CREATED" + + ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " + drop table test sync; + restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}'); + " | grep -o "RESTORED" + + check test proj FILE_DOESNT_EXIST + + broken_projections_info test + + break_projection test proj all_2_2_0 part + + check test proj + + broken_projections_info test + + ${CLICKHOUSE_CLIENT} -nm --query " + set send_logs_level='fatal'; + backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2') + " 2>&1 | grep -o "FILE_DOESNT_EXIST" + + materialize_projection test proj + + check test proj + + broken_projections_info test + + ${CLICKHOUSE_CLIENT} -nm --query " + backup 
table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3') + " | grep -o "BACKUP_CREATED" + + ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " + drop table test sync; + restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3'); + " | grep -o "RESTORED" + + check test proj + + break_projection test proj all_2_2_0 part + + check test proj FILE_DOESNT_EXIST + + broken_projections_info test + + ${CLICKHOUSE_CLIENT} -nm --query " + backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2') + settings check_projection_parts=false, allow_backup_broken_projections=true; + " | grep -o "BACKUP_CREATED" + + ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " + drop table test sync; + restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2'); + " | grep -o "RESTORED" + + check test + + broken_projections_info test +} + +test1 +test2 +test3 + + +#$CLICKHOUSE_CLIENT -nm -q " +#DROP TABLE test SYNC; +#DROP TABLE test2 SYNC; +#DROP TABLE test2_replica SYNC; +#" From 6632589d72ed270626e012c86a78a8f0c8411fb3 Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 30 Nov 2023 13:54:22 +0100 Subject: [PATCH 0030/1081] Review fix --- src/Storages/MergeTree/MergeTreeData.cpp | 6 +++--- tests/queries/0_stateless/02916_broken_projection.sh | 10 +++++----- 2 files changed, 8 insertions(+), 8 deletions(-) diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index c95aee88aee..1ba4153bc3e 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -7669,7 +7669,7 @@ MovePartsOutcome MergeTreeData::moveParts(const CurrentlyMovingPartsTaggerPtr & bool MergeTreeData::partsContainSameProjections(const DataPartPtr & left, const DataPartPtr & right, String & out_reason) { - auto remove_broken_parts = [](auto & parts) + auto remove_broken_parts_from_consideration = [](auto & parts) { std::set broken_projection_parts; for (const auto & [name, part] : parts) @@ -7684,8 +7684,8 @@ bool MergeTreeData::partsContainSameProjections(const DataPartPtr & left, const auto left_projection_parts = left->getProjectionParts(); auto right_projection_parts = right->getProjectionParts(); - remove_broken_parts(left_projection_parts); - remove_broken_parts(right_projection_parts); + remove_broken_parts_from_consideration(left_projection_parts); + remove_broken_parts_from_consideration(right_projection_parts); if (left_projection_parts.size() != right_projection_parts.size()) { diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 1555139e16f..60b21216d1a 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -495,8 +495,8 @@ test2 test3 -#$CLICKHOUSE_CLIENT -nm -q " -#DROP TABLE test SYNC; -#DROP TABLE test2 SYNC; -#DROP TABLE test2_replica SYNC; -#" +$CLICKHOUSE_CLIENT -nm -q " +DROP TABLE IF EXISTS test SYNC; +DROP TABLE IF EXISTS test2 SYNC; +DROP TABLE IF EXISTS test2_replica SYNC; +" From caf4dc7e14e594da3c254822b345b79c57e76d19 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Fri, 1 Dec 2023 12:21:47 +0100 Subject: [PATCH 0031/1081] Fix style check --- src/Common/ErrorCodes.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Common/ErrorCodes.cpp b/src/Common/ErrorCodes.cpp index 
b0ed754536d..57aa82f3639 100644 --- a/src/Common/ErrorCodes.cpp +++ b/src/Common/ErrorCodes.cpp @@ -587,7 +587,7 @@ M(705, TABLE_NOT_EMPTY) \ M(706, LIBSSH_ERROR) \ M(707, GCP_ERROR) \ - M(708, ILLEGAL_STATISTIC) \ + M(708, ILLEGAL_STATISTIC) \ M(709, BROKEN_PROJECTION) \ \ M(999, KEEPER_EXCEPTION) \ From f609c44eb83fc769ba9e8fc5875bbc10e3e17b9b Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Fri, 1 Dec 2023 13:38:28 +0100 Subject: [PATCH 0032/1081] Update 02916_broken_projection.sh --- tests/queries/0_stateless/02916_broken_projection.sh | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 60b21216d1a..bd141d1a122 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -459,11 +459,13 @@ function test3() broken_projections_info test ${CLICKHOUSE_CLIENT} -nm --query " + set send_logs_level='fatal'; backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3') " | grep -o "BACKUP_CREATED" ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " drop table test sync; + set send_logs_level='fatal'; restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3'); " | grep -o "RESTORED" @@ -476,12 +478,14 @@ function test3() broken_projections_info test ${CLICKHOUSE_CLIENT} -nm --query " + set send_logs_level='fatal'; backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2') settings check_projection_parts=false, allow_backup_broken_projections=true; " | grep -o "BACKUP_CREATED" ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " drop table test sync; + set send_logs_level='fatal'; restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2'); " | grep -o "RESTORED" From d0827e3ea77ff432c4a6a66145827428bcd62b5e Mon Sep 17 00:00:00 2001 From: Nikolai Kochetov Date: Fri, 1 Dec 2023 17:45:23 +0000 Subject: [PATCH 0033/1081] Add a test. 
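
The test introduced below exercises a MergeTree TTL DELETE clause whose WHERE condition contains an IN subquery, the case that the follow-up "support subqueries in TTL" commits in this series then implement. As a minimal illustrative sketch of that pattern (table and column names here are hypothetical and not part of the patch):

CREATE TABLE events
(
    id UInt32,
    ts DateTime
)
ENGINE = MergeTree
ORDER BY id
-- expired rows are removed only if id is present in the allow_list table
TTL ts + INTERVAL 1 DAY WHERE id IN (SELECT id FROM allow_list);

The regression test added by this commit follows the same shape, filling a helper table first and then checking that the TTL with the subquery can be evaluated during merges.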
--- .../0_stateless/02932_set_ttl_where.reference | 0 .../0_stateless/02932_set_ttl_where.sql | 22 +++++++++++++++++++ 2 files changed, 22 insertions(+) create mode 100644 tests/queries/0_stateless/02932_set_ttl_where.reference create mode 100644 tests/queries/0_stateless/02932_set_ttl_where.sql diff --git a/tests/queries/0_stateless/02932_set_ttl_where.reference b/tests/queries/0_stateless/02932_set_ttl_where.reference new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/queries/0_stateless/02932_set_ttl_where.sql b/tests/queries/0_stateless/02932_set_ttl_where.sql new file mode 100644 index 00000000000..85fddf613e8 --- /dev/null +++ b/tests/queries/0_stateless/02932_set_ttl_where.sql @@ -0,0 +1,22 @@ +create or replace table temp ( + a UInt32 +) +engine = MergeTree +order by a; + +insert into temp select number from system.numbers limit 100_000; + +create or replace table t_temp ( + a UInt32, + timestamp DateTime +) +engine = MergeTree +order by a +TTL timestamp + INTERVAL 2 SECOND WHERE a in (select a from temp); + +select sleep(1); +insert into t_temp select rand(), now() from system.numbers limit 1_000_000; +select sleep(1); +insert into t_temp select rand(), now() from system.numbers limit 1_000_000; +select sleep(1); +optimize table t_temp final; From 508046e6922c0cb163ce5611f1e6ef6a22f8b7f1 Mon Sep 17 00:00:00 2001 From: Nikolai Kochetov Date: Fri, 1 Dec 2023 20:31:26 +0000 Subject: [PATCH 0034/1081] Attempt to support subqueries in TTL. --- src/Interpreters/PreparedSets.cpp | 8 ++- src/Interpreters/PreparedSets.h | 1 + src/Processors/TTL/ITTLAlgorithm.cpp | 5 +- src/Processors/TTL/ITTLAlgorithm.h | 9 ++- .../TTL/TTLAggregationAlgorithm.cpp | 11 ++-- src/Processors/TTL/TTLAggregationAlgorithm.h | 1 + src/Processors/TTL/TTLColumnAlgorithm.cpp | 5 +- src/Processors/TTL/TTLColumnAlgorithm.h | 1 + src/Processors/TTL/TTLDeleteAlgorithm.cpp | 10 +-- src/Processors/TTL/TTLDeleteAlgorithm.h | 2 +- src/Processors/TTL/TTLUpdateInfoAlgorithm.cpp | 5 +- src/Processors/TTL/TTLUpdateInfoAlgorithm.h | 1 + src/Processors/Transforms/TTLTransform.cpp | 2 +- .../MergeTree/MergeTreeDataWriter.cpp | 19 +++--- src/Storages/StorageInMemoryMetadata.cpp | 21 +++---- src/Storages/TTLDescription.cpp | 62 ++++++++++++------- src/Storages/TTLDescription.h | 15 ++++- 17 files changed, 116 insertions(+), 62 deletions(-) diff --git a/src/Interpreters/PreparedSets.cpp b/src/Interpreters/PreparedSets.cpp index 955d8892284..ea8d9a62b8b 100644 --- a/src/Interpreters/PreparedSets.cpp +++ b/src/Interpreters/PreparedSets.cpp @@ -189,11 +189,17 @@ SetPtr FutureSetFromSubquery::buildOrderedSetInplace(const ContextPtr & context) } } + set_and_key->set->fillSetElements(); + + return buildSetInplace(context); +} + +SetPtr FutureSetFromSubquery::buildSetInplace(const ContextPtr & context) +{ auto plan = build(context); if (!plan) return nullptr; - set_and_key->set->fillSetElements(); auto builder = plan->buildQueryPipeline(QueryPlanOptimizationSettings::fromContext(context), BuildQueryPipelineSettings::fromContext(context)); auto pipeline = QueryPipelineBuilder::getPipeline(std::move(*builder)); pipeline.complete(std::make_shared(Block())); diff --git a/src/Interpreters/PreparedSets.h b/src/Interpreters/PreparedSets.h index e237789c63c..3e751d309ba 100644 --- a/src/Interpreters/PreparedSets.h +++ b/src/Interpreters/PreparedSets.h @@ -107,6 +107,7 @@ public: SetPtr get() const override; DataTypes getTypes() const override; SetPtr buildOrderedSetInplace(const ContextPtr & context) override; + SetPtr 
buildSetInplace(const ContextPtr & context); std::unique_ptr build(const ContextPtr & context); diff --git a/src/Processors/TTL/ITTLAlgorithm.cpp b/src/Processors/TTL/ITTLAlgorithm.cpp index 79140137df8..af6c4e4ac35 100644 --- a/src/Processors/TTL/ITTLAlgorithm.cpp +++ b/src/Processors/TTL/ITTLAlgorithm.cpp @@ -11,8 +11,9 @@ namespace ErrorCodes } ITTLAlgorithm::ITTLAlgorithm( - const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_) - : description(description_) + const TTlExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_) + : ttl_expressions(ttl_expressions_) + , description(description_) , old_ttl_info(old_ttl_info_) , current_time(current_time_) , force(force_) diff --git a/src/Processors/TTL/ITTLAlgorithm.h b/src/Processors/TTL/ITTLAlgorithm.h index 49cd2c46d9d..6e73286b564 100644 --- a/src/Processors/TTL/ITTLAlgorithm.h +++ b/src/Processors/TTL/ITTLAlgorithm.h @@ -8,6 +8,12 @@ namespace DB { +struct TTlExpressions +{ + ExpressionActionsPtr expression; + ExpressionActionsPtr where_expression; +}; + /** * Represents the actions, which are required to do * with data, when TTL is expired: delete, aggregate, etc. @@ -18,7 +24,7 @@ public: using TTLInfo = IMergeTreeDataPart::TTLInfo; using MutableDataPartPtr = MergeTreeMutableDataPartPtr; - ITTLAlgorithm(const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_); + ITTLAlgorithm(const TTlExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_); virtual ~ITTLAlgorithm() = default; virtual void execute(Block & block) = 0; @@ -39,6 +45,7 @@ protected: bool isTTLExpired(time_t ttl) const; UInt32 getTimestampByIndex(const IColumn * column, size_t index) const; + const TTlExpressions ttl_expressions; const TTLDescription description; const TTLInfo old_ttl_info; const time_t current_time; diff --git a/src/Processors/TTL/TTLAggregationAlgorithm.cpp b/src/Processors/TTL/TTLAggregationAlgorithm.cpp index fa3436ec55d..ab2ba5f58fc 100644 --- a/src/Processors/TTL/TTLAggregationAlgorithm.cpp +++ b/src/Processors/TTL/TTLAggregationAlgorithm.cpp @@ -5,13 +5,14 @@ namespace DB { TTLAggregationAlgorithm::TTLAggregationAlgorithm( + const TTlExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_, const Block & header_, const MergeTreeData & storage_) - : ITTLAlgorithm(description_, old_ttl_info_, current_time_, force_) + : ITTLAlgorithm(ttl_expressions_, description_, old_ttl_info_, current_time_, force_) , header(header_) { current_key_value.resize(description.group_by_keys.size()); @@ -73,8 +74,8 @@ void TTLAggregationAlgorithm::execute(Block & block) const auto & column_names = header.getNames(); MutableColumns aggregate_columns = header.cloneEmptyColumns(); - auto ttl_column = executeExpressionAndGetColumn(description.expression, block, description.result_column); - auto where_column = executeExpressionAndGetColumn(description.where_expression, block, description.where_result_column); + auto ttl_column = executeExpressionAndGetColumn(ttl_expressions.expression, block, description.result_column); + auto where_column = executeExpressionAndGetColumn(ttl_expressions.where_expression, block, description.where_result_column); size_t rows_aggregated = 0; size_t current_key_start = 0; @@ -145,8 +146,8 @@ void 
TTLAggregationAlgorithm::execute(Block & block) /// If some rows were aggregated we have to recalculate ttl info's if (some_rows_were_aggregated) { - auto ttl_column_after_aggregation = executeExpressionAndGetColumn(description.expression, block, description.result_column); - auto where_column_after_aggregation = executeExpressionAndGetColumn(description.where_expression, block, description.where_result_column); + auto ttl_column_after_aggregation = executeExpressionAndGetColumn(ttl_expressions.expression, block, description.result_column); + auto where_column_after_aggregation = executeExpressionAndGetColumn(ttl_expressions.where_expression, block, description.where_result_column); for (size_t i = 0; i < block.rows(); ++i) { bool where_filter_passed = !where_column_after_aggregation || where_column_after_aggregation->getBool(i); diff --git a/src/Processors/TTL/TTLAggregationAlgorithm.h b/src/Processors/TTL/TTLAggregationAlgorithm.h index 0e4bf092ed6..9fd074efba8 100644 --- a/src/Processors/TTL/TTLAggregationAlgorithm.h +++ b/src/Processors/TTL/TTLAggregationAlgorithm.h @@ -13,6 +13,7 @@ class TTLAggregationAlgorithm final : public ITTLAlgorithm { public: TTLAggregationAlgorithm( + const TTlExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, diff --git a/src/Processors/TTL/TTLColumnAlgorithm.cpp b/src/Processors/TTL/TTLColumnAlgorithm.cpp index 04c4d7b9348..cb99dcf99b1 100644 --- a/src/Processors/TTL/TTLColumnAlgorithm.cpp +++ b/src/Processors/TTL/TTLColumnAlgorithm.cpp @@ -4,6 +4,7 @@ namespace DB { TTLColumnAlgorithm::TTLColumnAlgorithm( + const TTlExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, @@ -12,7 +13,7 @@ TTLColumnAlgorithm::TTLColumnAlgorithm( const ExpressionActionsPtr & default_expression_, const String & default_column_name_, bool is_compact_part_) - : ITTLAlgorithm(description_, old_ttl_info_, current_time_, force_) + : ITTLAlgorithm(ttl_expressions_, description_, old_ttl_info_, current_time_, force_) , column_name(column_name_) , default_expression(default_expression_) , default_column_name(default_column_name_) @@ -49,7 +50,7 @@ void TTLColumnAlgorithm::execute(Block & block) if (default_column) default_column = default_column->convertToFullColumnIfConst(); - auto ttl_column = executeExpressionAndGetColumn(description.expression, block, description.result_column); + auto ttl_column = executeExpressionAndGetColumn(ttl_expressions.expression, block, description.result_column); auto & column_with_type = block.getByName(column_name); const IColumn * values_column = column_with_type.column.get(); diff --git a/src/Processors/TTL/TTLColumnAlgorithm.h b/src/Processors/TTL/TTLColumnAlgorithm.h index 30de77dcc2a..efcd7c74454 100644 --- a/src/Processors/TTL/TTLColumnAlgorithm.h +++ b/src/Processors/TTL/TTLColumnAlgorithm.h @@ -11,6 +11,7 @@ class TTLColumnAlgorithm final : public ITTLAlgorithm { public: TTLColumnAlgorithm( + const TTlExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, diff --git a/src/Processors/TTL/TTLDeleteAlgorithm.cpp b/src/Processors/TTL/TTLDeleteAlgorithm.cpp index f176df2d003..6a172e9c3c3 100644 --- a/src/Processors/TTL/TTLDeleteAlgorithm.cpp +++ b/src/Processors/TTL/TTLDeleteAlgorithm.cpp @@ -4,8 +4,8 @@ namespace DB { TTLDeleteAlgorithm::TTLDeleteAlgorithm( - const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, 
bool force_) - : ITTLAlgorithm(description_, old_ttl_info_, current_time_, force_) + const TTlExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_) + : ITTLAlgorithm(ttl_expressions_, description_, old_ttl_info_, current_time_, force_) { if (!isMinTTLExpired()) new_ttl_info = old_ttl_info; @@ -19,8 +19,8 @@ void TTLDeleteAlgorithm::execute(Block & block) if (!block || !isMinTTLExpired()) return; - auto ttl_column = executeExpressionAndGetColumn(description.expression, block, description.result_column); - auto where_column = executeExpressionAndGetColumn(description.where_expression, block, description.where_result_column); + auto ttl_column = executeExpressionAndGetColumn(ttl_expressions.expression, block, description.result_column); + auto where_column = executeExpressionAndGetColumn(ttl_expressions.where_expression, block, description.where_result_column); MutableColumns result_columns; const auto & column_names = block.getNames(); @@ -54,7 +54,7 @@ void TTLDeleteAlgorithm::execute(Block & block) void TTLDeleteAlgorithm::finalize(const MutableDataPartPtr & data_part) const { - if (description.where_expression) + if (ttl_expressions.where_expression) data_part->ttl_infos.rows_where_ttl[description.result_column] = new_ttl_info; else data_part->ttl_infos.table_ttl = new_ttl_info; diff --git a/src/Processors/TTL/TTLDeleteAlgorithm.h b/src/Processors/TTL/TTLDeleteAlgorithm.h index 292a29bfa27..23389070774 100644 --- a/src/Processors/TTL/TTLDeleteAlgorithm.h +++ b/src/Processors/TTL/TTLDeleteAlgorithm.h @@ -10,7 +10,7 @@ namespace DB class TTLDeleteAlgorithm final : public ITTLAlgorithm { public: - TTLDeleteAlgorithm(const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_); + TTLDeleteAlgorithm(const TTlExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_); void execute(Block & block) override; void finalize(const MutableDataPartPtr & data_part) const override; diff --git a/src/Processors/TTL/TTLUpdateInfoAlgorithm.cpp b/src/Processors/TTL/TTLUpdateInfoAlgorithm.cpp index eba364aa2b8..34c0cad70ea 100644 --- a/src/Processors/TTL/TTLUpdateInfoAlgorithm.cpp +++ b/src/Processors/TTL/TTLUpdateInfoAlgorithm.cpp @@ -4,13 +4,14 @@ namespace DB { TTLUpdateInfoAlgorithm::TTLUpdateInfoAlgorithm( + const TTlExpressions & ttl_expressions_, const TTLDescription & description_, const TTLUpdateField ttl_update_field_, const String ttl_update_key_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_) - : ITTLAlgorithm(description_, old_ttl_info_, current_time_, force_) + : ITTLAlgorithm(ttl_expressions_, description_, old_ttl_info_, current_time_, force_) , ttl_update_field(ttl_update_field_) , ttl_update_key(ttl_update_key_) { @@ -21,7 +22,7 @@ void TTLUpdateInfoAlgorithm::execute(Block & block) if (!block) return; - auto ttl_column = executeExpressionAndGetColumn(description.expression, block, description.result_column); + auto ttl_column = executeExpressionAndGetColumn(ttl_expressions.expression, block, description.result_column); for (size_t i = 0; i < block.rows(); ++i) { UInt32 cur_ttl = ITTLAlgorithm::getTimestampByIndex(ttl_column.get(), i); diff --git a/src/Processors/TTL/TTLUpdateInfoAlgorithm.h b/src/Processors/TTL/TTLUpdateInfoAlgorithm.h index 45eecbde3d0..e9bcfcdec88 100644 --- a/src/Processors/TTL/TTLUpdateInfoAlgorithm.h +++ b/src/Processors/TTL/TTLUpdateInfoAlgorithm.h @@ 
-20,6 +20,7 @@ class TTLUpdateInfoAlgorithm : public ITTLAlgorithm { public: TTLUpdateInfoAlgorithm( + const TTlExpressions & ttl_expressions_, const TTLDescription & description_, const TTLUpdateField ttl_update_field_, const String ttl_update_key_, diff --git a/src/Processors/Transforms/TTLTransform.cpp b/src/Processors/Transforms/TTLTransform.cpp index 7cde86098c7..d3d45f68d46 100644 --- a/src/Processors/Transforms/TTLTransform.cpp +++ b/src/Processors/Transforms/TTLTransform.cpp @@ -36,7 +36,7 @@ TTLTransform::TTLTransform( rows_ttl, old_ttl_infos.table_ttl, current_time_, force_); /// Skip all data if table ttl is expired for part - if (algorithm->isMaxTTLExpired() && !rows_ttl.where_expression) + if (algorithm->isMaxTTLExpired() && !rows_ttl.where_expression_ast) all_data_dropped = true; delete_algorithm = algorithm.get(); diff --git a/src/Storages/MergeTree/MergeTreeDataWriter.cpp b/src/Storages/MergeTree/MergeTreeDataWriter.cpp index 2a381afa805..d080240b066 100644 --- a/src/Storages/MergeTree/MergeTreeDataWriter.cpp +++ b/src/Storages/MergeTree/MergeTreeDataWriter.cpp @@ -125,13 +125,18 @@ void buildScatterSelector( /// Computes ttls and updates ttl infos void updateTTL( + const ContextPtr context, const TTLDescription & ttl_entry, IMergeTreeDataPart::TTLInfos & ttl_infos, DB::MergeTreeDataPartTTLInfo & ttl_info, const Block & block, bool update_part_min_max_ttls) { - auto ttl_column = ITTLAlgorithm::executeExpressionAndGetColumn(ttl_entry.expression, block, ttl_entry.result_column); + auto expr_and_set = ttl_entry.buildExpression(); + for (auto & subquery : expr_and_set.sets->getSubqueries()) + subquery->buildSetInplace(context); + + auto ttl_column = ITTLAlgorithm::executeExpressionAndGetColumn(expr_and_set.expression, block, ttl_entry.result_column); if (const ColumnUInt16 * column_date = typeid_cast(ttl_column.get())) { @@ -488,7 +493,7 @@ MergeTreeDataWriter::TemporaryPart MergeTreeDataWriter::writeTempPartImpl( DB::IMergeTreeDataPart::TTLInfos move_ttl_infos; const auto & move_ttl_entries = metadata_snapshot->getMoveTTLs(); for (const auto & ttl_entry : move_ttl_entries) - updateTTL(ttl_entry, move_ttl_infos, move_ttl_infos.moves_ttl[ttl_entry.result_column], block, false); + updateTTL(context, ttl_entry, move_ttl_infos, move_ttl_infos.moves_ttl[ttl_entry.result_column], block, false); ReservationPtr reservation = data.reserveSpacePreferringTTLRules(metadata_snapshot, expected_size, move_ttl_infos, time(nullptr), 0, true); VolumePtr volume = data.getStoragePolicy()->getVolume(0); @@ -543,20 +548,20 @@ MergeTreeDataWriter::TemporaryPart MergeTreeDataWriter::writeTempPartImpl( } if (metadata_snapshot->hasRowsTTL()) - updateTTL(metadata_snapshot->getRowsTTL(), new_data_part->ttl_infos, new_data_part->ttl_infos.table_ttl, block, true); + updateTTL(context, metadata_snapshot->getRowsTTL(), new_data_part->ttl_infos, new_data_part->ttl_infos.table_ttl, block, true); for (const auto & ttl_entry : metadata_snapshot->getGroupByTTLs()) - updateTTL(ttl_entry, new_data_part->ttl_infos, new_data_part->ttl_infos.group_by_ttl[ttl_entry.result_column], block, true); + updateTTL(context, ttl_entry, new_data_part->ttl_infos, new_data_part->ttl_infos.group_by_ttl[ttl_entry.result_column], block, true); for (const auto & ttl_entry : metadata_snapshot->getRowsWhereTTLs()) - updateTTL(ttl_entry, new_data_part->ttl_infos, new_data_part->ttl_infos.rows_where_ttl[ttl_entry.result_column], block, true); + updateTTL(context, ttl_entry, new_data_part->ttl_infos, 
new_data_part->ttl_infos.rows_where_ttl[ttl_entry.result_column], block, true); for (const auto & [name, ttl_entry] : metadata_snapshot->getColumnTTLs()) - updateTTL(ttl_entry, new_data_part->ttl_infos, new_data_part->ttl_infos.columns_ttl[name], block, true); + updateTTL(context, ttl_entry, new_data_part->ttl_infos, new_data_part->ttl_infos.columns_ttl[name], block, true); const auto & recompression_ttl_entries = metadata_snapshot->getRecompressionTTLs(); for (const auto & ttl_entry : recompression_ttl_entries) - updateTTL(ttl_entry, new_data_part->ttl_infos, new_data_part->ttl_infos.recompression_ttl[ttl_entry.result_column], block, false); + updateTTL(context, ttl_entry, new_data_part->ttl_infos, new_data_part->ttl_infos.recompression_ttl[ttl_entry.result_column], block, false); new_data_part->ttl_infos.update(move_ttl_infos); diff --git a/src/Storages/StorageInMemoryMetadata.cpp b/src/Storages/StorageInMemoryMetadata.cpp index af285a953dc..7db5af82e0b 100644 --- a/src/Storages/StorageInMemoryMetadata.cpp +++ b/src/Storages/StorageInMemoryMetadata.cpp @@ -193,7 +193,7 @@ TTLDescription StorageInMemoryMetadata::getRowsTTL() const bool StorageInMemoryMetadata::hasRowsTTL() const { - return table_ttl.rows_ttl.expression != nullptr; + return table_ttl.rows_ttl.expression_ast != nullptr; } TTLDescriptions StorageInMemoryMetadata::getRowsWhereTTLs() const @@ -251,9 +251,8 @@ ColumnDependencies StorageInMemoryMetadata::getColumnDependencies( NameSet required_ttl_columns; NameSet updated_ttl_columns; - auto add_dependent_columns = [&updated_columns](const auto & expression, auto & to_set) + auto add_dependent_columns = [&updated_columns](const Names & required_columns, auto & to_set) { - auto required_columns = expression->getRequiredColumns(); for (const auto & dependency : required_columns) { if (updated_columns.contains(dependency)) @@ -269,13 +268,13 @@ ColumnDependencies StorageInMemoryMetadata::getColumnDependencies( for (const auto & index : getSecondaryIndices()) { if (has_dependency(index.name, ColumnDependency::SKIP_INDEX)) - add_dependent_columns(index.expression, indices_columns); + add_dependent_columns(index.expression->getRequiredColumns(), indices_columns); } for (const auto & projection : getProjections()) { if (has_dependency(projection.name, ColumnDependency::PROJECTION)) - add_dependent_columns(&projection, projections_columns); + add_dependent_columns(projection.getRequiredColumns(), projections_columns); } auto add_for_rows_ttl = [&](const auto & expression, auto & to_set) @@ -289,25 +288,25 @@ ColumnDependencies StorageInMemoryMetadata::getColumnDependencies( }; if (hasRowsTTL()) - add_for_rows_ttl(getRowsTTL().expression, required_ttl_columns); + add_for_rows_ttl(getRowsTTL().expression_columns, required_ttl_columns); for (const auto & entry : getRowsWhereTTLs()) - add_for_rows_ttl(entry.expression, required_ttl_columns); + add_for_rows_ttl(entry.expression_columns, required_ttl_columns); for (const auto & entry : getGroupByTTLs()) - add_for_rows_ttl(entry.expression, required_ttl_columns); + add_for_rows_ttl(entry.expression_columns, required_ttl_columns); for (const auto & entry : getRecompressionTTLs()) - add_dependent_columns(entry.expression, required_ttl_columns); + add_dependent_columns(entry.expression_columns, required_ttl_columns); for (const auto & [name, entry] : getColumnTTLs()) { - if (add_dependent_columns(entry.expression, required_ttl_columns) && include_ttl_target) + if (add_dependent_columns(entry.expression_columns, required_ttl_columns) && 
include_ttl_target) updated_ttl_columns.insert(name); } for (const auto & entry : getMoveTTLs()) - add_dependent_columns(entry.expression, required_ttl_columns); + add_dependent_columns(entry.expression_columns, required_ttl_columns); //TODO what about rows_where_ttl and group_by_ttl ?? diff --git a/src/Storages/TTLDescription.cpp b/src/Storages/TTLDescription.cpp index f601fed06ac..47138f30e4f 100644 --- a/src/Storages/TTLDescription.cpp +++ b/src/Storages/TTLDescription.cpp @@ -113,11 +113,11 @@ TTLDescription::TTLDescription(const TTLDescription & other) , if_exists(other.if_exists) , recompression_codec(other.recompression_codec) { - if (other.expression) - expression = other.expression->clone(); + // if (other.expression) + // expression = other.expression->clone(); - if (other.where_expression) - where_expression = other.where_expression->clone(); + // if (other.where_expression) + // where_expression = other.where_expression->clone(); } TTLDescription & TTLDescription::operator=(const TTLDescription & other) @@ -131,16 +131,16 @@ TTLDescription & TTLDescription::operator=(const TTLDescription & other) else expression_ast.reset(); - if (other.expression) - expression = other.expression->clone(); - else - expression.reset(); + // if (other.expression) + // expression = other.expression->clone(); + // else + // expression.reset(); result_column = other.result_column; - if (other.where_expression) - where_expression = other.where_expression->clone(); - else - where_expression.reset(); + // if (other.where_expression) + // where_expression = other.where_expression->clone(); + // else + // where_expression.reset(); where_result_column = other.where_result_column; group_by_keys = other.group_by_keys; @@ -158,6 +158,17 @@ TTLDescription & TTLDescription::operator=(const TTLDescription & other) return * this; } +static ExpressionAndSets buildExpressionAndSets(ASTPtr & ast, const NamesAndTypesList & columns, const ContextPtr & context) +{ + ExpressionAndSets result; + auto syntax_analyzer_result = TreeRewriter(context).analyze(ast, columns); + ExpressionAnalyzer analyzer(ast, syntax_analyzer_result, context); + result.expression = analyzer.getActions(false); + result.sets = analyzer.getPreparedSets(); + + return result; +} + TTLDescription TTLDescription::getTTLFromAST( const ASTPtr & definition_ast, const ColumnsDescription & columns, @@ -174,10 +185,15 @@ TTLDescription TTLDescription::getTTLFromAST( result.expression_ast = definition_ast->clone(); auto ttl_ast = result.expression_ast->clone(); - auto syntax_analyzer_result = TreeRewriter(context).analyze(ttl_ast, columns.getAllPhysical()); - result.expression = ExpressionAnalyzer(ttl_ast, syntax_analyzer_result, context).getActions(false); + auto expression = buildExpressionAndSets(ttl_ast, columns.getAllPhysical(), context).expression; + result.expression_columns = expression->getRequiredColumns(); + + // auto syntax_analyzer_result = TreeRewriter(context).analyze(ttl_ast, columns.getAllPhysical()); + // result.expression = ExpressionAnalyzer(ttl_ast, syntax_analyzer_result, context).getActions(false); result.result_column = ttl_ast->getColumnName(); + ExpressionActionsPtr where_expression; + if (ttl_element == nullptr) /// columns TTL { result.destination_type = DataDestinationType::DELETE; @@ -194,8 +210,10 @@ TTLDescription TTLDescription::getTTLFromAST( { if (ASTPtr where_expr_ast = ttl_element->where()) { - auto where_syntax_result = TreeRewriter(context).analyze(where_expr_ast, columns.getAllPhysical()); - result.where_expression = 
ExpressionAnalyzer(where_expr_ast, where_syntax_result, context).getActions(false); + result.where_expression_ast = where_expr_ast->clone(); + where_expression = buildExpressionAndSets(where_expr_ast, columns.getAllPhysical(), context).expression; + // auto where_syntax_result = TreeRewriter(context).analyze(where_expr_ast, columns.getAllPhysical()); + // result.where_expression = ExpressionAnalyzer(where_expr_ast, where_syntax_result, context).getActions(false); result.where_result_column = where_expr_ast->getColumnName(); } } @@ -221,17 +239,17 @@ TTLDescription TTLDescription::getTTLFromAST( for (const auto & ast : ttl_element->group_by_assignments) { const auto assignment = ast->as(); - auto expression = assignment.expression(); + auto ass_expression = assignment.expression(); FindAggregateFunctionVisitor::Data data{false}; - FindAggregateFunctionVisitor(data).visit(expression); + FindAggregateFunctionVisitor(data).visit(ass_expression); if (!data.has_aggregate_function) throw Exception(ErrorCodes::BAD_TTL_EXPRESSION, "Invalid expression for assignment of column {}. Should contain an aggregate function", assignment.column_name); - expression = addTypeConversionToAST(std::move(expression), columns.getPhysical(assignment.column_name).type->getName()); - aggregations.emplace_back(assignment.column_name, std::move(expression)); + ass_expression = addTypeConversionToAST(std::move(ass_expression), columns.getPhysical(assignment.column_name).type->getName()); + aggregations.emplace_back(assignment.column_name, std::move(ass_expression)); aggregation_columns_set.insert(assignment.column_name); } @@ -289,7 +307,7 @@ TTLDescription TTLDescription::getTTLFromAST( } } - checkTTLExpression(result.expression, result.result_column); + checkTTLExpression(expression, result.result_column); return result; } @@ -341,7 +359,7 @@ TTLTableDescription TTLTableDescription::getTTLForTableFromAST( auto ttl = TTLDescription::getTTLFromAST(ttl_element_ptr, columns, context, primary_key); if (ttl.mode == TTLMode::DELETE) { - if (!ttl.where_expression) + if (!ttl.where_expression_ast) { if (have_unconditional_delete_ttl) throw Exception(ErrorCodes::BAD_TTL_EXPRESSION, "More than one DELETE TTL expression without WHERE expression is not allowed"); diff --git a/src/Storages/TTLDescription.h b/src/Storages/TTLDescription.h index 8f60eb604b5..5ea243424cb 100644 --- a/src/Storages/TTLDescription.h +++ b/src/Storages/TTLDescription.h @@ -33,6 +33,15 @@ struct TTLAggregateDescription using TTLAggregateDescriptions = std::vector; +class PreparedSets; +using PreparedSetsPtr = std::shared_ptr; + +struct ExpressionAndSets +{ + ExpressionActionsPtr expression; + PreparedSetsPtr sets; +}; + /// Common struct for TTL record in storage struct TTLDescription { @@ -42,9 +51,10 @@ struct TTLDescription /// TTL d + INTERVAL 1 DAY /// ^~~~~~~~~~~~~~~~~~~^ ASTPtr expression_ast; + Names expression_columns; /// Expression actions evaluated from AST - ExpressionActionsPtr expression; + ExpressionAndSets buildExpression() const; /// Result column of this TTL expression String result_column; @@ -52,7 +62,8 @@ struct TTLDescription /// WHERE part in TTL expression /// TTL ... 
WHERE x % 10 == 0 and y > 5 /// ^~~~~~~~~~~~~~~~~~~~~~^ - ExpressionActionsPtr where_expression; + ASTPtr where_expression_ast; + ExpressionAndSets buildWhereExpression() const; /// Name of result column from WHERE expression String where_result_column; From 2b903003b4795eb3768fec3f84ec8321fa5485f6 Mon Sep 17 00:00:00 2001 From: kssenii Date: Mon, 4 Dec 2023 13:21:18 +0100 Subject: [PATCH 0035/1081] Update reference --- .../0_stateless/02916_broken_projection.reference | 8 +++----- tests/queries/0_stateless/02916_broken_projection.sh | 9 ++++----- 2 files changed, 7 insertions(+), 10 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index 4c4901ae99f..acd1b87eb30 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -332,16 +332,14 @@ all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj', expect error: proj -FILE_DOESNT_EXIST select from projection 'proj_2', expect error: proj 12 16 used projections SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table -0 +1 broken projections info -all_2_2_0 proj NO_FILE_IN_DATA_PART 0 broke all data of part 'proj' (parent part: all_2_2_0) system.parts @@ -358,7 +356,7 @@ SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 broken projections info -all_2_2_0 proj NO_FILE_IN_DATA_PART +all_2_2_0 proj FILE_DOESNT_EXIST FILE_DOESNT_EXIST materialize projection proj system.parts @@ -379,7 +377,7 @@ SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 broken projections info -all_2_2_0 proj NO_FILE_IN_DATA_PART +all_2_2_0 proj FILE_DOESNT_EXIST BACKUP_CREATED RESTORED system.parts diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index bd141d1a122..7315cf5ce61 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -29,7 +29,7 @@ function create_table() SELECT d ORDER BY c ) ) - ENGINE = ReplicatedMergeTree('/test_broken_projection_24_$test_id/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '$replica') ORDER BY a + ENGINE = ReplicatedMergeTree('/test_broken_projection_$test_id/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '$replica') ORDER BY a SETTINGS min_bytes_for_wide_part = 0, max_parts_to_merge_at_once=3, enable_vertical_merge_algorithm=1, @@ -407,7 +407,6 @@ function test2() check test2 } -CLICKHOUSE_TEST_UNIQUE_NAME="gghhhhhhhhhhhhhhhhhhh" function test3() { create_table test3 test 1 @@ -437,7 +436,7 @@ function test3() restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}'); " | grep -o "RESTORED" - check test proj FILE_DOESNT_EXIST + check test proj broken_projections_info test @@ -479,14 +478,14 @@ function test3() ${CLICKHOUSE_CLIENT} -nm --query " set send_logs_level='fatal'; - backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2') + backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_4') settings check_projection_parts=false, allow_backup_broken_projections=true; " | grep -o "BACKUP_CREATED" ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " drop table test sync; set send_logs_level='fatal'; - restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2'); + 
restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_4'); " | grep -o "RESTORED" check test From b77a6073aea98c7c5f5fcc28492a34e801d11b6b Mon Sep 17 00:00:00 2001 From: kssenii Date: Mon, 4 Dec 2023 16:57:09 +0100 Subject: [PATCH 0036/1081] Fix test --- .../02916_broken_projection.reference | 90 +++++++++++-------- .../0_stateless/02916_broken_projection.sh | 36 ++++---- 2 files changed, 70 insertions(+), 56 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index acd1b87eb30..b7764a6434e 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -7,12 +7,12 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections @@ -26,12 +26,12 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections @@ -51,7 +51,7 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: proj_2 +select from projection 'proj' 12 16 used projections @@ -68,12 +68,12 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections @@ -102,12 +102,12 @@ all_3_3_0 0 ['proj','proj_2'] all_3_5_1 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections @@ -139,12 +139,12 @@ all_3_3_0 0 ['proj','proj_2'] all_3_5_1 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections @@ -167,12 +167,12 @@ all_3_5_1 0 ['proj'] all_3_5_1_6 1 ['proj'] all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections @@ -208,12 +208,12 @@ all_4_4_0 0 ['proj','proj_2'] all_5_5_0 0 ['proj','proj_2'] all_8_8_0 0 ['proj','proj_2'] all_9_9_0 1 
['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj_2 -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections @@ -227,20 +227,19 @@ insert new part system.parts all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' used projections SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' used projections SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 system.parts -all_1_1_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' used projections SELECT c FROM test2_replica WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' used projections SELECT d FROM test2_replica WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table @@ -252,10 +251,10 @@ all_0_0_0 system.parts all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' used projections SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' used projections SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table @@ -266,10 +265,10 @@ all_0_0_0 system.parts all_0_0_0 0 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' used projections SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' used projections SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table @@ -277,10 +276,10 @@ check table system.parts all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' used projections SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' used projections SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table @@ -294,12 +293,12 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections @@ -315,7 +314,7 @@ all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj', expect error: proj FILE_DOESNT_EXIST -select from projection 'proj_2', expect error: proj +select from projection 'proj_2' 12 16 used projections @@ -331,8 +330,12 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: proj -select from projection 'proj_2', expect error: proj +select from projection 'proj' +12 +16 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2' 12 16 used projections @@ -348,7 +351,8 @@ all_1_1_0 1 
['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj', expect error: proj -select from projection 'proj_2', expect error: proj +STD_EXCEPTION +select from projection 'proj_2' 12 16 used projections @@ -368,8 +372,12 @@ all_2_2_0 0 ['proj','proj_2'] all_2_2_0_4 1 ['proj','proj_2'] all_3_3_0 0 ['proj','proj_2'] all_3_3_0_4 1 ['proj','proj_2'] -select from projection 'proj', expect error: proj -select from projection 'proj_2', expect error: proj +select from projection 'proj' +12 +16 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2' 12 16 used projections @@ -385,8 +393,12 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: proj -select from projection 'proj_2', expect error: proj +select from projection 'proj' +12 +16 +used projections +SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj +select from projection 'proj_2' 12 16 used projections @@ -401,7 +413,7 @@ all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj', expect error: proj -select from projection 'proj_2', expect error: proj +select from projection 'proj_2' 12 16 used projections @@ -417,12 +429,12 @@ all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] all_2_2_0 1 ['proj_2'] all_3_3_0 1 ['proj','proj_2'] -select from projection 'proj', expect error: +select from projection 'proj' 12 16 used projections SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: +select from projection 'proj_2' 12 16 used projections diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 7315cf5ce61..eeea512f14a 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -29,7 +29,7 @@ function create_table() SELECT d ORDER BY c ) ) - ENGINE = ReplicatedMergeTree('/test_broken_projection_$test_id/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '$replica') ORDER BY a + ENGINE = ReplicatedMergeTree('/test_broken_projection_32_$test_id/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '$replica') ORDER BY a SETTINGS min_bytes_for_wide_part = 0, max_parts_to_merge_at_once=3, enable_vertical_merge_algorithm=1, @@ -155,39 +155,41 @@ function check() WHERE table='$table' AND database=currentDatabase() ORDER BY name;" - echo "select from projection 'proj', expect error: $expect_broken_part" query_id=$(random 8) if [ "$expect_broken_part" = "proj" ] then + echo "select from projection 'proj', expect error: $expect_broken_part" $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -nm -q " -SET send_logs_level='fatal'; -SELECT c FROM $table WHERE d == 12 ORDER BY c; -" 2>&1 | grep -oF "$expected_error" + SET send_logs_level='fatal'; + SELECT c FROM $table WHERE d == 12 ORDER BY c; + " 2>&1 | grep -oF "$expected_error" else + echo "select from projection 'proj'" $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM $table WHERE d == 12 OR d == 16 ORDER BY c;" echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " - SYSTEM FLUSH LOGS; - SELECT query, splitByChar('.', arrayJoin(projections))[-1] FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' + SYSTEM FLUSH LOGS; + SELECT query, 
splitByChar('.', arrayJoin(projections))[-1] FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' " fi - echo "select from projection 'proj_2', expect error: $expect_broken_part" query_id=$(random 8) if [ "$expect_broken_part" = "proj_2" ] then + echo "select from projection 'proj_2', expect error: $expect_broken_part" $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -nm -q " -SET send_logs_level='fatal'; -SELECT d FROM $table WHERE c == 12 ORDER BY d; -" 2>&1 | grep -oF "$expected_error" + SET send_logs_level='fatal'; + SELECT d FROM $table WHERE c == 12 ORDER BY d; + " 2>&1 | grep -oF "$expected_error" else + echo "select from projection 'proj_2'" $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM $table WHERE c == 12 OR c == 16 ORDER BY d;" echo 'used projections' $CLICKHOUSE_CLIENT -nm -q " - SYSTEM FLUSH LOGS; - SELECT query, splitByChar('.', arrayJoin(projections))[-1] FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' + SYSTEM FLUSH LOGS; + SELECT query, splitByChar('.', arrayJoin(projections))[-1] FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' " fi @@ -436,13 +438,13 @@ function test3() restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}'); " | grep -o "RESTORED" - check test proj + check test broken_projections_info test break_projection test proj all_2_2_0 part - check test proj + check test proj STD_EXCEPTION broken_projections_info test @@ -453,7 +455,7 @@ function test3() materialize_projection test proj - check test proj + check test broken_projections_info test @@ -468,7 +470,7 @@ function test3() restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3'); " | grep -o "RESTORED" - check test proj + check test break_projection test proj all_2_2_0 part From 7ab4af06df0d78e6728e3cc5c727e5c9e4cc33ef Mon Sep 17 00:00:00 2001 From: Nikolai Kochetov Date: Mon, 4 Dec 2023 18:04:42 +0000 Subject: [PATCH 0037/1081] Attempt to support subqueries in TTL. 
(2) --- src/Processors/QueryPlan/CreatingSetsStep.cpp | 29 +++++++++++ src/Processors/QueryPlan/CreatingSetsStep.h | 2 + src/Processors/TTL/ITTLAlgorithm.cpp | 2 +- src/Processors/TTL/ITTLAlgorithm.h | 6 +-- .../TTL/TTLAggregationAlgorithm.cpp | 2 +- src/Processors/TTL/TTLAggregationAlgorithm.h | 2 +- src/Processors/TTL/TTLColumnAlgorithm.cpp | 2 +- src/Processors/TTL/TTLColumnAlgorithm.h | 2 +- src/Processors/TTL/TTLDeleteAlgorithm.cpp | 2 +- src/Processors/TTL/TTLDeleteAlgorithm.h | 2 +- src/Processors/TTL/TTLUpdateInfoAlgorithm.cpp | 2 +- src/Processors/TTL/TTLUpdateInfoAlgorithm.h | 2 +- .../Transforms/TTLCalcTransform.cpp | 33 ++++++++++--- src/Processors/Transforms/TTLCalcTransform.h | 4 ++ src/Processors/Transforms/TTLTransform.cpp | 33 ++++++++++--- src/Processors/Transforms/TTLTransform.h | 5 ++ src/Storages/MergeTree/MergeTask.cpp | 36 +++++++++----- .../MergeTree/MergeTreeDataWriter.cpp | 2 +- src/Storages/MergeTree/MutateTask.cpp | 49 ++++++++++++++----- src/Storages/StorageInMemoryMetadata.cpp | 8 +-- src/Storages/TTLDescription.cpp | 21 +++++++- src/Storages/TTLDescription.h | 7 +-- 22 files changed, 197 insertions(+), 56 deletions(-) diff --git a/src/Processors/QueryPlan/CreatingSetsStep.cpp b/src/Processors/QueryPlan/CreatingSetsStep.cpp index 3e4dfb0c7d1..11415e8d815 100644 --- a/src/Processors/QueryPlan/CreatingSetsStep.cpp +++ b/src/Processors/QueryPlan/CreatingSetsStep.cpp @@ -157,6 +157,35 @@ void addCreatingSetsStep(QueryPlan & query_plan, PreparedSets::Subqueries subque query_plan.unitePlans(std::move(creating_sets), std::move(plans)); } +QueryPipelineBuilderPtr addCreatingSetsTransform(QueryPipelineBuilderPtr pipeline, PreparedSets::Subqueries subqueries, ContextPtr context) +{ + DataStreams input_streams; + input_streams.emplace_back(DataStream{pipeline->getHeader()}); + + QueryPipelineBuilders pipelines; + pipelines.reserve(1 + subqueries.size()); + pipelines.push_back(std::move(pipeline)); + + auto plan_settings = QueryPlanOptimizationSettings::fromContext(context); + auto pipeline_settings = BuildQueryPipelineSettings::fromContext(context); + + for (auto & future_set : subqueries) + { + if (future_set->get()) + continue; + + auto plan = future_set->build(context); + if (!plan) + continue; + + input_streams.emplace_back(plan->getCurrentDataStream()); + pipelines.emplace_back(plan->buildQueryPipeline(plan_settings, pipeline_settings)); + } + + CreatingSetsStep(input_streams).updatePipeline(std::move(pipelines), pipeline_settings); + return std::move(pipelines.front()); +} + std::vector> DelayedCreatingSetsStep::makePlansForSets(DelayedCreatingSetsStep && step) { std::vector> plans; diff --git a/src/Processors/QueryPlan/CreatingSetsStep.h b/src/Processors/QueryPlan/CreatingSetsStep.h index a90b70a2fa4..292ec19914c 100644 --- a/src/Processors/QueryPlan/CreatingSetsStep.h +++ b/src/Processors/QueryPlan/CreatingSetsStep.h @@ -72,4 +72,6 @@ void addCreatingSetsStep(QueryPlan & query_plan, PreparedSets::Subqueries subque void addCreatingSetsStep(QueryPlan & query_plan, PreparedSetsPtr prepared_sets, ContextPtr context); +QueryPipelineBuilderPtr addCreatingSetsTransform(QueryPipelineBuilderPtr pipeline, PreparedSets::Subqueries subqueries, ContextPtr context); + } diff --git a/src/Processors/TTL/ITTLAlgorithm.cpp b/src/Processors/TTL/ITTLAlgorithm.cpp index af6c4e4ac35..761f43e2422 100644 --- a/src/Processors/TTL/ITTLAlgorithm.cpp +++ b/src/Processors/TTL/ITTLAlgorithm.cpp @@ -11,7 +11,7 @@ namespace ErrorCodes } ITTLAlgorithm::ITTLAlgorithm( - const TTlExpressions & 
ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_) + const TTLExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_) : ttl_expressions(ttl_expressions_) , description(description_) , old_ttl_info(old_ttl_info_) diff --git a/src/Processors/TTL/ITTLAlgorithm.h b/src/Processors/TTL/ITTLAlgorithm.h index 6e73286b564..d79aa8a8dfc 100644 --- a/src/Processors/TTL/ITTLAlgorithm.h +++ b/src/Processors/TTL/ITTLAlgorithm.h @@ -8,7 +8,7 @@ namespace DB { -struct TTlExpressions +struct TTLExpressions { ExpressionActionsPtr expression; ExpressionActionsPtr where_expression; @@ -24,7 +24,7 @@ public: using TTLInfo = IMergeTreeDataPart::TTLInfo; using MutableDataPartPtr = MergeTreeMutableDataPartPtr; - ITTLAlgorithm(const TTlExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_); + ITTLAlgorithm(const TTLExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_); virtual ~ITTLAlgorithm() = default; virtual void execute(Block & block) = 0; @@ -45,7 +45,7 @@ protected: bool isTTLExpired(time_t ttl) const; UInt32 getTimestampByIndex(const IColumn * column, size_t index) const; - const TTlExpressions ttl_expressions; + const TTLExpressions ttl_expressions; const TTLDescription description; const TTLInfo old_ttl_info; const time_t current_time; diff --git a/src/Processors/TTL/TTLAggregationAlgorithm.cpp b/src/Processors/TTL/TTLAggregationAlgorithm.cpp index ab2ba5f58fc..0c6184a56e5 100644 --- a/src/Processors/TTL/TTLAggregationAlgorithm.cpp +++ b/src/Processors/TTL/TTLAggregationAlgorithm.cpp @@ -5,7 +5,7 @@ namespace DB { TTLAggregationAlgorithm::TTLAggregationAlgorithm( - const TTlExpressions & ttl_expressions_, + const TTLExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, diff --git a/src/Processors/TTL/TTLAggregationAlgorithm.h b/src/Processors/TTL/TTLAggregationAlgorithm.h index 9fd074efba8..f7bf19a202b 100644 --- a/src/Processors/TTL/TTLAggregationAlgorithm.h +++ b/src/Processors/TTL/TTLAggregationAlgorithm.h @@ -13,7 +13,7 @@ class TTLAggregationAlgorithm final : public ITTLAlgorithm { public: TTLAggregationAlgorithm( - const TTlExpressions & ttl_expressions_, + const TTLExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, diff --git a/src/Processors/TTL/TTLColumnAlgorithm.cpp b/src/Processors/TTL/TTLColumnAlgorithm.cpp index cb99dcf99b1..e27050564ce 100644 --- a/src/Processors/TTL/TTLColumnAlgorithm.cpp +++ b/src/Processors/TTL/TTLColumnAlgorithm.cpp @@ -4,7 +4,7 @@ namespace DB { TTLColumnAlgorithm::TTLColumnAlgorithm( - const TTlExpressions & ttl_expressions_, + const TTLExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, diff --git a/src/Processors/TTL/TTLColumnAlgorithm.h b/src/Processors/TTL/TTLColumnAlgorithm.h index efcd7c74454..f34dae952d1 100644 --- a/src/Processors/TTL/TTLColumnAlgorithm.h +++ b/src/Processors/TTL/TTLColumnAlgorithm.h @@ -11,7 +11,7 @@ class TTLColumnAlgorithm final : public ITTLAlgorithm { public: TTLColumnAlgorithm( - const TTlExpressions & ttl_expressions_, + const TTLExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, 
time_t current_time_, diff --git a/src/Processors/TTL/TTLDeleteAlgorithm.cpp b/src/Processors/TTL/TTLDeleteAlgorithm.cpp index 6a172e9c3c3..6f9bc315276 100644 --- a/src/Processors/TTL/TTLDeleteAlgorithm.cpp +++ b/src/Processors/TTL/TTLDeleteAlgorithm.cpp @@ -4,7 +4,7 @@ namespace DB { TTLDeleteAlgorithm::TTLDeleteAlgorithm( - const TTlExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_) + const TTLExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_) : ITTLAlgorithm(ttl_expressions_, description_, old_ttl_info_, current_time_, force_) { if (!isMinTTLExpired()) diff --git a/src/Processors/TTL/TTLDeleteAlgorithm.h b/src/Processors/TTL/TTLDeleteAlgorithm.h index 23389070774..622e45acecb 100644 --- a/src/Processors/TTL/TTLDeleteAlgorithm.h +++ b/src/Processors/TTL/TTLDeleteAlgorithm.h @@ -10,7 +10,7 @@ namespace DB class TTLDeleteAlgorithm final : public ITTLAlgorithm { public: - TTLDeleteAlgorithm(const TTlExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_); + TTLDeleteAlgorithm(const TTLExpressions & ttl_expressions_, const TTLDescription & description_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_); void execute(Block & block) override; void finalize(const MutableDataPartPtr & data_part) const override; diff --git a/src/Processors/TTL/TTLUpdateInfoAlgorithm.cpp b/src/Processors/TTL/TTLUpdateInfoAlgorithm.cpp index 34c0cad70ea..b7cddf3c165 100644 --- a/src/Processors/TTL/TTLUpdateInfoAlgorithm.cpp +++ b/src/Processors/TTL/TTLUpdateInfoAlgorithm.cpp @@ -4,7 +4,7 @@ namespace DB { TTLUpdateInfoAlgorithm::TTLUpdateInfoAlgorithm( - const TTlExpressions & ttl_expressions_, + const TTLExpressions & ttl_expressions_, const TTLDescription & description_, const TTLUpdateField ttl_update_field_, const String ttl_update_key_, diff --git a/src/Processors/TTL/TTLUpdateInfoAlgorithm.h b/src/Processors/TTL/TTLUpdateInfoAlgorithm.h index e9bcfcdec88..0cf31765aef 100644 --- a/src/Processors/TTL/TTLUpdateInfoAlgorithm.h +++ b/src/Processors/TTL/TTLUpdateInfoAlgorithm.h @@ -20,7 +20,7 @@ class TTLUpdateInfoAlgorithm : public ITTLAlgorithm { public: TTLUpdateInfoAlgorithm( - const TTlExpressions & ttl_expressions_, + const TTLExpressions & ttl_expressions_, const TTLDescription & description_, const TTLUpdateField ttl_update_field_, const String ttl_update_key_, diff --git a/src/Processors/Transforms/TTLCalcTransform.cpp b/src/Processors/Transforms/TTLCalcTransform.cpp index 31fb61239ef..204dfe21733 100644 --- a/src/Processors/Transforms/TTLCalcTransform.cpp +++ b/src/Processors/Transforms/TTLCalcTransform.cpp @@ -4,7 +4,22 @@ namespace DB { +static TTLExpressions getExpressions(const TTLDescription & ttl_descr, PreparedSets::Subqueries & subqueries_for_sets, const ContextPtr & context) +{ + auto expr = ttl_descr.buildExpression(context); + auto where_expr = ttl_descr.buildWhereExpression(context); + + auto expr_queries = expr.sets->getSubqueries(); + auto where_expr_queries = expr.sets->getSubqueries(); + + subqueries_for_sets.insert(subqueries_for_sets.end(), expr_queries.begin(), expr_queries.end()); + subqueries_for_sets.insert(subqueries_for_sets.end(), where_expr_queries.begin(), where_expr_queries.end()); + + return {expr.expression, where_expr.expression}; +} + TTLCalcTransform::TTLCalcTransform( + const ContextPtr & context, const Block & 
header_, const MergeTreeData & storage_, const StorageMetadataPtr & metadata_snapshot_, @@ -21,33 +36,39 @@ TTLCalcTransform::TTLCalcTransform( { const auto & rows_ttl = metadata_snapshot_->getRowsTTL(); algorithms.emplace_back(std::make_unique( - rows_ttl, TTLUpdateField::TABLE_TTL, rows_ttl.result_column, old_ttl_infos.table_ttl, current_time_, force_)); + getExpressions(rows_ttl, subqueries_for_sets, context), rows_ttl, + TTLUpdateField::TABLE_TTL, rows_ttl.result_column, old_ttl_infos.table_ttl, current_time_, force_)); } for (const auto & where_ttl : metadata_snapshot_->getRowsWhereTTLs()) algorithms.emplace_back(std::make_unique( - where_ttl, TTLUpdateField::ROWS_WHERE_TTL, where_ttl.result_column, old_ttl_infos.rows_where_ttl[where_ttl.result_column], current_time_, force_)); + getExpressions(where_ttl, subqueries_for_sets, context), where_ttl, + TTLUpdateField::ROWS_WHERE_TTL, where_ttl.result_column, old_ttl_infos.rows_where_ttl[where_ttl.result_column], current_time_, force_)); for (const auto & group_by_ttl : metadata_snapshot_->getGroupByTTLs()) algorithms.emplace_back(std::make_unique( - group_by_ttl, TTLUpdateField::GROUP_BY_TTL, group_by_ttl.result_column, old_ttl_infos.group_by_ttl[group_by_ttl.result_column], current_time_, force_)); + getExpressions(group_by_ttl, subqueries_for_sets, context), group_by_ttl, + TTLUpdateField::GROUP_BY_TTL, group_by_ttl.result_column, old_ttl_infos.group_by_ttl[group_by_ttl.result_column], current_time_, force_)); if (metadata_snapshot_->hasAnyColumnTTL()) { for (const auto & [name, description] : metadata_snapshot_->getColumnTTLs()) { algorithms.emplace_back(std::make_unique( - description, TTLUpdateField::COLUMNS_TTL, name, old_ttl_infos.columns_ttl[name], current_time_, force_)); + getExpressions(description, subqueries_for_sets, context), description, + TTLUpdateField::COLUMNS_TTL, name, old_ttl_infos.columns_ttl[name], current_time_, force_)); } } for (const auto & move_ttl : metadata_snapshot_->getMoveTTLs()) algorithms.emplace_back(std::make_unique( - move_ttl, TTLUpdateField::MOVES_TTL, move_ttl.result_column, old_ttl_infos.moves_ttl[move_ttl.result_column], current_time_, force_)); + getExpressions(move_ttl, subqueries_for_sets, context), move_ttl, + TTLUpdateField::MOVES_TTL, move_ttl.result_column, old_ttl_infos.moves_ttl[move_ttl.result_column], current_time_, force_)); for (const auto & recompression_ttl : metadata_snapshot_->getRecompressionTTLs()) algorithms.emplace_back(std::make_unique( - recompression_ttl, TTLUpdateField::RECOMPRESSION_TTL, recompression_ttl.result_column, old_ttl_infos.recompression_ttl[recompression_ttl.result_column], current_time_, force_)); + getExpressions(recompression_ttl, subqueries_for_sets, context), recompression_ttl, + TTLUpdateField::RECOMPRESSION_TTL, recompression_ttl.result_column, old_ttl_infos.recompression_ttl[recompression_ttl.result_column], current_time_, force_)); } void TTLCalcTransform::consume(Chunk chunk) diff --git a/src/Processors/Transforms/TTLCalcTransform.h b/src/Processors/Transforms/TTLCalcTransform.h index 495879400dc..960438f5f2b 100644 --- a/src/Processors/Transforms/TTLCalcTransform.h +++ b/src/Processors/Transforms/TTLCalcTransform.h @@ -15,6 +15,7 @@ class TTLCalcTransform : public IAccumulatingTransform { public: TTLCalcTransform( + const ContextPtr & context, const Block & header_, const MergeTreeData & storage_, const StorageMetadataPtr & metadata_snapshot_, @@ -23,6 +24,8 @@ public: bool force_ ); + PreparedSets::Subqueries getSubqueries() { return 
std::move(subqueries_for_sets); } + String getName() const override { return "TTL_CALC"; } Status prepare() override; @@ -35,6 +38,7 @@ protected: private: std::vector algorithms; + PreparedSets::Subqueries subqueries_for_sets; /// ttl_infos and empty_columns are updating while reading const MergeTreeData::MutableDataPartPtr & data_part; diff --git a/src/Processors/Transforms/TTLTransform.cpp b/src/Processors/Transforms/TTLTransform.cpp index d3d45f68d46..69e2e6e5fc0 100644 --- a/src/Processors/Transforms/TTLTransform.cpp +++ b/src/Processors/Transforms/TTLTransform.cpp @@ -16,7 +16,22 @@ namespace DB { +static TTLExpressions getExpressions(const TTLDescription & ttl_descr, PreparedSets::Subqueries & subqueries_for_sets, const ContextPtr & context) +{ + auto expr = ttl_descr.buildExpression(context); + auto where_expr = ttl_descr.buildWhereExpression(context); + + auto expr_queries = expr.sets->getSubqueries(); + auto where_expr_queries = expr.sets->getSubqueries(); + + subqueries_for_sets.insert(subqueries_for_sets.end(), expr_queries.begin(), expr_queries.end()); + subqueries_for_sets.insert(subqueries_for_sets.end(), where_expr_queries.begin(), where_expr_queries.end()); + + return {expr.expression, where_expr.expression}; +} + TTLTransform::TTLTransform( + const ContextPtr & context, const Block & header_, const MergeTreeData & storage_, const StorageMetadataPtr & metadata_snapshot_, @@ -33,7 +48,8 @@ TTLTransform::TTLTransform( { const auto & rows_ttl = metadata_snapshot_->getRowsTTL(); auto algorithm = std::make_unique( - rows_ttl, old_ttl_infos.table_ttl, current_time_, force_); + getExpressions(rows_ttl, subqueries_for_sets, context), rows_ttl, + old_ttl_infos.table_ttl, current_time_, force_); /// Skip all data if table ttl is expired for part if (algorithm->isMaxTTLExpired() && !rows_ttl.where_expression_ast) @@ -45,11 +61,13 @@ TTLTransform::TTLTransform( for (const auto & where_ttl : metadata_snapshot_->getRowsWhereTTLs()) algorithms.emplace_back(std::make_unique( - where_ttl, old_ttl_infos.rows_where_ttl[where_ttl.result_column], current_time_, force_)); + getExpressions(where_ttl, subqueries_for_sets, context), where_ttl, + old_ttl_infos.rows_where_ttl[where_ttl.result_column], current_time_, force_)); for (const auto & group_by_ttl : metadata_snapshot_->getGroupByTTLs()) algorithms.emplace_back(std::make_unique( - group_by_ttl, old_ttl_infos.group_by_ttl[group_by_ttl.result_column], current_time_, force_, + getExpressions(group_by_ttl, subqueries_for_sets, context), group_by_ttl, + old_ttl_infos.group_by_ttl[group_by_ttl.result_column], current_time_, force_, getInputPort().getHeader(), storage_)); if (metadata_snapshot_->hasAnyColumnTTL()) @@ -75,18 +93,21 @@ TTLTransform::TTLTransform( } algorithms.emplace_back(std::make_unique( - description, old_ttl_infos.columns_ttl[name], current_time_, + getExpressions(description, subqueries_for_sets, context), description, + old_ttl_infos.columns_ttl[name], current_time_, force_, name, default_expression, default_column_name, isCompactPart(data_part))); } } for (const auto & move_ttl : metadata_snapshot_->getMoveTTLs()) algorithms.emplace_back(std::make_unique( - move_ttl, TTLUpdateField::MOVES_TTL, move_ttl.result_column, old_ttl_infos.moves_ttl[move_ttl.result_column], current_time_, force_)); + getExpressions(move_ttl, subqueries_for_sets, context), move_ttl, + TTLUpdateField::MOVES_TTL, move_ttl.result_column, old_ttl_infos.moves_ttl[move_ttl.result_column], current_time_, force_)); for (const auto & recompression_ttl : 
metadata_snapshot_->getRecompressionTTLs()) algorithms.emplace_back(std::make_unique( - recompression_ttl, TTLUpdateField::RECOMPRESSION_TTL, recompression_ttl.result_column, old_ttl_infos.recompression_ttl[recompression_ttl.result_column], current_time_, force_)); + getExpressions(recompression_ttl, subqueries_for_sets, context), recompression_ttl, + TTLUpdateField::RECOMPRESSION_TTL, recompression_ttl.result_column, old_ttl_infos.recompression_ttl[recompression_ttl.result_column], current_time_, force_)); } Block reorderColumns(Block block, const Block & header) diff --git a/src/Processors/Transforms/TTLTransform.h b/src/Processors/Transforms/TTLTransform.h index 3f0dffd1998..47da456a2e3 100644 --- a/src/Processors/Transforms/TTLTransform.h +++ b/src/Processors/Transforms/TTLTransform.h @@ -16,6 +16,7 @@ class TTLTransform : public IAccumulatingTransform { public: TTLTransform( + const ContextPtr & context, const Block & header_, const MergeTreeData & storage_, const StorageMetadataPtr & metadata_snapshot_, @@ -28,6 +29,8 @@ public: Status prepare() override; + PreparedSets::Subqueries getSubqueries() { return std::move(subqueries_for_sets); } + protected: void consume(Chunk chunk) override; Chunk generate() override; @@ -40,6 +43,8 @@ private: const TTLDeleteAlgorithm * delete_algorithm = nullptr; bool all_data_dropped = false; + PreparedSets::Subqueries subqueries_for_sets; + /// ttl_infos and empty_columns are updating while reading const MergeTreeData::MutableDataPartPtr & data_part; Poco::Logger * log; diff --git a/src/Storages/MergeTree/MergeTask.cpp b/src/Storages/MergeTree/MergeTask.cpp index e8e307bb148..26b290d33d5 100644 --- a/src/Storages/MergeTree/MergeTask.cpp +++ b/src/Storages/MergeTree/MergeTask.cpp @@ -31,6 +31,9 @@ #include #include #include +#include +#include +#include namespace DB { @@ -1004,8 +1007,9 @@ void MergeTask::ExecuteAndFinalizeHorizontalPart::createMergedStream() break; } - auto res_pipe = Pipe::unitePipes(std::move(pipes)); - res_pipe.addTransform(std::move(merged_transform)); + auto builder = std::make_unique(); + builder->init(Pipe::unitePipes(std::move(pipes))); + builder->addTransform(std::move(merged_transform)); if (global_ctx->deduplicate) { @@ -1021,26 +1025,34 @@ void MergeTask::ExecuteAndFinalizeHorizontalPart::createMergedStream() } if (DistinctSortedTransform::isApplicable(header, sort_description, global_ctx->deduplicate_by_columns)) - res_pipe.addTransform(std::make_shared( - res_pipe.getHeader(), sort_description, SizeLimits(), 0 /*limit_hint*/, global_ctx->deduplicate_by_columns)); + builder->addTransform(std::make_shared( + builder->getHeader(), sort_description, SizeLimits(), 0 /*limit_hint*/, global_ctx->deduplicate_by_columns)); else - res_pipe.addTransform(std::make_shared( - res_pipe.getHeader(), SizeLimits(), 0 /*limit_hint*/, global_ctx->deduplicate_by_columns)); + builder->addTransform(std::make_shared( + builder->getHeader(), SizeLimits(), 0 /*limit_hint*/, global_ctx->deduplicate_by_columns)); } + PreparedSets::Subqueries subqueries; + if (ctx->need_remove_expired_values) - res_pipe.addTransform(std::make_shared( - res_pipe.getHeader(), *global_ctx->data, global_ctx->metadata_snapshot, global_ctx->new_data_part, global_ctx->time_of_merge, ctx->force_ttl)); + { + auto transform = std::make_shared(global_ctx->context, builder->getHeader(), *global_ctx->data, global_ctx->metadata_snapshot, global_ctx->new_data_part, global_ctx->time_of_merge, ctx->force_ttl); + subqueries = transform->getSubqueries(); + 
builder->addTransform(std::move(transform)); + } if (global_ctx->metadata_snapshot->hasSecondaryIndices()) { const auto & indices = global_ctx->metadata_snapshot->getSecondaryIndices(); - res_pipe.addTransform(std::make_shared( - res_pipe.getHeader(), indices.getSingleExpressionForIndices(global_ctx->metadata_snapshot->getColumns(), global_ctx->data->getContext()))); - res_pipe.addTransform(std::make_shared(res_pipe.getHeader())); + builder->addTransform(std::make_shared( + builder->getHeader(), indices.getSingleExpressionForIndices(global_ctx->metadata_snapshot->getColumns(), global_ctx->data->getContext()))); + builder->addTransform(std::make_shared(builder->getHeader())); } - global_ctx->merged_pipeline = QueryPipeline(std::move(res_pipe)); + if (!subqueries.empty()) + builder = addCreatingSetsTransform(std::move(builder), std::move(subqueries), global_ctx->context); + + global_ctx->merged_pipeline = QueryPipelineBuilder::getPipeline(std::move(*builder)); /// Dereference unique_ptr and pass horizontal_stage_progress by reference global_ctx->merged_pipeline.setProgressCallback(MergeProgressCallback(global_ctx->merge_list_element_ptr, global_ctx->watch_prev_elapsed, *global_ctx->horizontal_stage_progress)); /// Is calculated inside MergeProgressCallback. diff --git a/src/Storages/MergeTree/MergeTreeDataWriter.cpp b/src/Storages/MergeTree/MergeTreeDataWriter.cpp index d080240b066..ce9e5762cb4 100644 --- a/src/Storages/MergeTree/MergeTreeDataWriter.cpp +++ b/src/Storages/MergeTree/MergeTreeDataWriter.cpp @@ -132,7 +132,7 @@ void updateTTL( const Block & block, bool update_part_min_max_ttls) { - auto expr_and_set = ttl_entry.buildExpression(); + auto expr_and_set = ttl_entry.buildExpression(context); for (auto & subquery : expr_and_set.sets->getSubqueries()) subquery->buildSetInplace(context); diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index 6b6b5947581..61849f94e44 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -8,6 +8,7 @@ #include #include #include +#include #include #include #include @@ -16,6 +17,7 @@ #include #include #include +#include #include #include #include @@ -1507,21 +1509,34 @@ private: if (!ctx->mutating_pipeline_builder.initialized()) throw Exception(ErrorCodes::LOGICAL_ERROR, "Cannot mutate part columns with uninitialized mutations stream. 
It's a bug"); - QueryPipelineBuilder builder(std::move(ctx->mutating_pipeline_builder)); + auto builder = std::make_unique(std::move(ctx->mutating_pipeline_builder)); if (ctx->metadata_snapshot->hasPrimaryKey() || ctx->metadata_snapshot->hasSecondaryIndices()) { - builder.addTransform(std::make_shared( - builder.getHeader(), ctx->data->getPrimaryKeyAndSkipIndicesExpression(ctx->metadata_snapshot, skip_indices))); + builder->addTransform(std::make_shared( + builder->getHeader(), ctx->data->getPrimaryKeyAndSkipIndicesExpression(ctx->metadata_snapshot, skip_indices))); - builder.addTransform(std::make_shared(builder.getHeader())); + builder->addTransform(std::make_shared(builder->getHeader())); } + PreparedSets::Subqueries subqueries; + if (ctx->execute_ttl_type == ExecuteTTLType::NORMAL) - builder.addTransform(std::make_shared(builder.getHeader(), *ctx->data, ctx->metadata_snapshot, ctx->new_data_part, ctx->time_of_mutation, true)); + { + auto transform = std::make_shared(ctx->context, builder->getHeader(), *ctx->data, ctx->metadata_snapshot, ctx->new_data_part, ctx->time_of_mutation, true); + subqueries = transform->getSubqueries(); + builder->addTransform(std::move(transform)); + } if (ctx->execute_ttl_type == ExecuteTTLType::RECALCULATE) - builder.addTransform(std::make_shared(builder.getHeader(), *ctx->data, ctx->metadata_snapshot, ctx->new_data_part, ctx->time_of_mutation, true)); + { + auto transform = std::make_shared(ctx->context, builder->getHeader(), *ctx->data, ctx->metadata_snapshot, ctx->new_data_part, ctx->time_of_mutation, true); + subqueries = transform->getSubqueries(); + builder->addTransform(std::move(transform)); + } + + if (!subqueries.empty()) + builder = addCreatingSetsTransform(std::move(builder), std::move(subqueries), ctx->context); ctx->minmax_idx = std::make_shared(); @@ -1537,7 +1552,7 @@ private: /*blocks_are_granules_size=*/ false, ctx->context->getWriteSettings()); - ctx->mutating_pipeline = QueryPipelineBuilder::getPipeline(std::move(builder)); + ctx->mutating_pipeline = QueryPipelineBuilder::getPipeline(std::move(*builder)); ctx->mutating_pipeline.setProgressCallback(ctx->progress_callback); /// Is calculated inside MergeProgressCallback. 
ctx->mutating_pipeline.disableProfileEventUpdate(); @@ -1712,13 +1727,25 @@ private: if (ctx->mutating_pipeline_builder.initialized()) { - QueryPipelineBuilder builder(std::move(ctx->mutating_pipeline_builder)); + auto builder = std::make_unique(std::move(ctx->mutating_pipeline_builder)); + PreparedSets::Subqueries subqueries; if (ctx->execute_ttl_type == ExecuteTTLType::NORMAL) - builder.addTransform(std::make_shared(builder.getHeader(), *ctx->data, ctx->metadata_snapshot, ctx->new_data_part, ctx->time_of_mutation, true)); + { + auto transform = std::make_shared(ctx->context, builder->getHeader(), *ctx->data, ctx->metadata_snapshot, ctx->new_data_part, ctx->time_of_mutation, true); + subqueries = transform->getSubqueries(); + builder->addTransform(std::move(transform)); + } if (ctx->execute_ttl_type == ExecuteTTLType::RECALCULATE) - builder.addTransform(std::make_shared(builder.getHeader(), *ctx->data, ctx->metadata_snapshot, ctx->new_data_part, ctx->time_of_mutation, true)); + { + auto transform = std::make_shared(ctx->context, builder->getHeader(), *ctx->data, ctx->metadata_snapshot, ctx->new_data_part, ctx->time_of_mutation, true); + subqueries = transform->getSubqueries(); + builder->addTransform(std::move(transform)); + } + + if (!subqueries.empty()) + builder = addCreatingSetsTransform(std::move(builder), std::move(subqueries), ctx->context); ctx->out = std::make_shared( ctx->new_data_part, @@ -1732,7 +1759,7 @@ private: &ctx->source_part->index_granularity_info ); - ctx->mutating_pipeline = QueryPipelineBuilder::getPipeline(std::move(builder)); + ctx->mutating_pipeline = QueryPipelineBuilder::getPipeline(std::move(*builder)); ctx->mutating_pipeline.setProgressCallback(ctx->progress_callback); /// Is calculated inside MergeProgressCallback. ctx->mutating_pipeline.disableProfileEventUpdate(); diff --git a/src/Storages/StorageInMemoryMetadata.cpp b/src/Storages/StorageInMemoryMetadata.cpp index 7db5af82e0b..158c13b653d 100644 --- a/src/Storages/StorageInMemoryMetadata.cpp +++ b/src/Storages/StorageInMemoryMetadata.cpp @@ -279,7 +279,7 @@ ColumnDependencies StorageInMemoryMetadata::getColumnDependencies( auto add_for_rows_ttl = [&](const auto & expression, auto & to_set) { - if (add_dependent_columns(expression, to_set) && include_ttl_target) + if (add_dependent_columns(expression.getNames(), to_set) && include_ttl_target) { /// Filter all columns, if rows TTL expression have to be recalculated. for (const auto & column : getColumns().getAllPhysical()) @@ -297,16 +297,16 @@ ColumnDependencies StorageInMemoryMetadata::getColumnDependencies( add_for_rows_ttl(entry.expression_columns, required_ttl_columns); for (const auto & entry : getRecompressionTTLs()) - add_dependent_columns(entry.expression_columns, required_ttl_columns); + add_dependent_columns(entry.expression_columns.getNames(), required_ttl_columns); for (const auto & [name, entry] : getColumnTTLs()) { - if (add_dependent_columns(entry.expression_columns, required_ttl_columns) && include_ttl_target) + if (add_dependent_columns(entry.expression_columns.getNames(), required_ttl_columns) && include_ttl_target) updated_ttl_columns.insert(name); } for (const auto & entry : getMoveTTLs()) - add_dependent_columns(entry.expression_columns, required_ttl_columns); + add_dependent_columns(entry.expression_columns.getNames(), required_ttl_columns); //TODO what about rows_where_ttl and group_by_ttl ?? 
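For orientation, the feature these TTL changes appear to target is a TTL `WHERE` clause whose condition needs a set built from a subquery: that is why `TTLTransform`/`TTLCalcTransform` now collect `PreparedSets::Subqueries` and why `MergeTask`/`MutateTask` run them through `addCreatingSetsTransform` before writing the new part. The sketch below mirrors the `02932_set_ttl_where` test touched later in this series; the table and column names are illustrative, not taken verbatim from the patch.

```sql
-- TTL with a WHERE condition that depends on a set built from a subquery;
-- the subquery is materialized (CreatingSetsTransform) before the TTL
-- expression is evaluated during a merge or mutation.
CREATE TABLE t_ttl_where
(
    a UInt32,
    timestamp DateTime
)
ENGINE = MergeTree
ORDER BY a
TTL timestamp + INTERVAL 2 SECOND WHERE a IN (SELECT number FROM system.numbers LIMIT 100_000);

INSERT INTO t_ttl_where SELECT rand(), now() FROM system.numbers LIMIT 1_000_000;
OPTIMIZE TABLE t_ttl_where FINAL; -- TTL is applied on merge; rows matching the WHERE set are dropped
```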
diff --git a/src/Storages/TTLDescription.cpp b/src/Storages/TTLDescription.cpp index 47138f30e4f..e02ac933028 100644 --- a/src/Storages/TTLDescription.cpp +++ b/src/Storages/TTLDescription.cpp @@ -169,6 +169,23 @@ static ExpressionAndSets buildExpressionAndSets(ASTPtr & ast, const NamesAndType return result; } +ExpressionAndSets TTLDescription::buildExpression(const ContextPtr & context) const +{ + auto ast = expression_ast->clone(); + return buildExpressionAndSets(ast, expression_columns, context); +} + +ExpressionAndSets TTLDescription::buildWhereExpression(const ContextPtr & context) const +{ + if (where_expression_ast) + { + auto ast = where_expression_ast->clone(); + return buildExpressionAndSets(ast, where_expression_columns, context); + } + + return {}; +} + TTLDescription TTLDescription::getTTLFromAST( const ASTPtr & definition_ast, const ColumnsDescription & columns, @@ -186,7 +203,7 @@ TTLDescription TTLDescription::getTTLFromAST( auto ttl_ast = result.expression_ast->clone(); auto expression = buildExpressionAndSets(ttl_ast, columns.getAllPhysical(), context).expression; - result.expression_columns = expression->getRequiredColumns(); + result.expression_columns = expression->getRequiredColumnsWithTypes(); // auto syntax_analyzer_result = TreeRewriter(context).analyze(ttl_ast, columns.getAllPhysical()); // result.expression = ExpressionAnalyzer(ttl_ast, syntax_analyzer_result, context).getActions(false); @@ -214,6 +231,8 @@ TTLDescription TTLDescription::getTTLFromAST( where_expression = buildExpressionAndSets(where_expr_ast, columns.getAllPhysical(), context).expression; // auto where_syntax_result = TreeRewriter(context).analyze(where_expr_ast, columns.getAllPhysical()); // result.where_expression = ExpressionAnalyzer(where_expr_ast, where_syntax_result, context).getActions(false); + + result.where_expression_columns = where_expression->getRequiredColumnsWithTypes(); result.where_result_column = where_expr_ast->getColumnName(); } } diff --git a/src/Storages/TTLDescription.h b/src/Storages/TTLDescription.h index 5ea243424cb..7dfc736ded2 100644 --- a/src/Storages/TTLDescription.h +++ b/src/Storages/TTLDescription.h @@ -51,10 +51,10 @@ struct TTLDescription /// TTL d + INTERVAL 1 DAY /// ^~~~~~~~~~~~~~~~~~~^ ASTPtr expression_ast; - Names expression_columns; + NamesAndTypesList expression_columns; /// Expression actions evaluated from AST - ExpressionAndSets buildExpression() const; + ExpressionAndSets buildExpression(const ContextPtr & context) const; /// Result column of this TTL expression String result_column; @@ -63,7 +63,8 @@ struct TTLDescription /// TTL ... 
WHERE x % 10 == 0 and y > 5 /// ^~~~~~~~~~~~~~~~~~~~~~^ ASTPtr where_expression_ast; - ExpressionAndSets buildWhereExpression() const; + NamesAndTypesList where_expression_columns; + ExpressionAndSets buildWhereExpression(const ContextPtr & context) const; /// Name of result column from WHERE expression String where_result_column; From 16558ccc840d7a15efb2ab0fe691a79c38dd5086 Mon Sep 17 00:00:00 2001 From: Nikolai Kochetov Date: Mon, 4 Dec 2023 18:13:34 +0000 Subject: [PATCH 0038/1081] Fix some tests --- src/Storages/TTLDescription.cpp | 11 +++++++++++ 1 file changed, 11 insertions(+) diff --git a/src/Storages/TTLDescription.cpp b/src/Storages/TTLDescription.cpp index e02ac933028..e32ff11860b 100644 --- a/src/Storages/TTLDescription.cpp +++ b/src/Storages/TTLDescription.cpp @@ -103,7 +103,10 @@ using FindAggregateFunctionVisitor = InDepthNodeVisitorclone() : nullptr) + , expression_columns(other.expression_columns) , result_column(other.result_column) + , where_expression_ast(other.where_expression_ast ? other.where_expression_ast->clone() : nullptr) + , where_expression_columns(other.where_expression_columns) , where_result_column(other.where_result_column) , group_by_keys(other.group_by_keys) , set_parts(other.set_parts) @@ -136,12 +139,20 @@ TTLDescription & TTLDescription::operator=(const TTLDescription & other) // else // expression.reset(); + expression_columns = other.expression_columns; result_column = other.result_column; + + if (other.where_expression_ast) + where_expression_ast = other.where_expression_ast->clone(); + else + where_expression_ast.reset(); + // if (other.where_expression) // where_expression = other.where_expression->clone(); // else // where_expression.reset(); + where_expression_columns = other.where_expression_columns; where_result_column = other.where_result_column; group_by_keys = other.group_by_keys; set_parts = other.set_parts; From 4de048904a3cbb6ff30e20b5a8defd1564f2e722 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Mon, 4 Dec 2023 19:14:06 +0100 Subject: [PATCH 0039/1081] Update 02916_broken_projection.sh --- tests/queries/0_stateless/02916_broken_projection.sh | 1 + 1 file changed, 1 insertion(+) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index eeea512f14a..261342da103 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -1,4 +1,5 @@ #!/usr/bin/env bash +# Tags: no-random-merge-tree-settings # shellcheck disable=SC2046 CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) From d3b80ac60cdb1fa17fb8907a7a6f11afde759bab Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Mon, 4 Dec 2023 19:14:55 +0100 Subject: [PATCH 0040/1081] Update 02916_broken_projection.sh --- tests/queries/0_stateless/02916_broken_projection.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 261342da103..0910ba177fb 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -1,5 +1,5 @@ #!/usr/bin/env bash -# Tags: no-random-merge-tree-settings +# Tags: long, no-random-merge-tree-settings # shellcheck disable=SC2046 CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) From 6a821f9e737373b28bc98f25e10439dd04e7bdb8 Mon Sep 17 00:00:00 2001 
From: Nikolai Kochetov Date: Mon, 4 Dec 2023 19:24:27 +0000 Subject: [PATCH 0041/1081] Fix some staff --- src/Processors/QueryPlan/CreatingSetsStep.cpp | 3 +-- src/Processors/Transforms/TTLCalcTransform.cpp | 12 +++++++----- src/Processors/Transforms/TTLTransform.cpp | 12 +++++++----- 3 files changed, 15 insertions(+), 12 deletions(-) diff --git a/src/Processors/QueryPlan/CreatingSetsStep.cpp b/src/Processors/QueryPlan/CreatingSetsStep.cpp index 11415e8d815..f13a717004f 100644 --- a/src/Processors/QueryPlan/CreatingSetsStep.cpp +++ b/src/Processors/QueryPlan/CreatingSetsStep.cpp @@ -182,8 +182,7 @@ QueryPipelineBuilderPtr addCreatingSetsTransform(QueryPipelineBuilderPtr pipelin pipelines.emplace_back(plan->buildQueryPipeline(plan_settings, pipeline_settings)); } - CreatingSetsStep(input_streams).updatePipeline(std::move(pipelines), pipeline_settings); - return std::move(pipelines.front()); + return CreatingSetsStep(input_streams).updatePipeline(std::move(pipelines), pipeline_settings); } std::vector> DelayedCreatingSetsStep::makePlansForSets(DelayedCreatingSetsStep && step) diff --git a/src/Processors/Transforms/TTLCalcTransform.cpp b/src/Processors/Transforms/TTLCalcTransform.cpp index 204dfe21733..0af9f38b20f 100644 --- a/src/Processors/Transforms/TTLCalcTransform.cpp +++ b/src/Processors/Transforms/TTLCalcTransform.cpp @@ -7,13 +7,15 @@ namespace DB static TTLExpressions getExpressions(const TTLDescription & ttl_descr, PreparedSets::Subqueries & subqueries_for_sets, const ContextPtr & context) { auto expr = ttl_descr.buildExpression(context); - auto where_expr = ttl_descr.buildWhereExpression(context); - auto expr_queries = expr.sets->getSubqueries(); - auto where_expr_queries = expr.sets->getSubqueries(); - subqueries_for_sets.insert(subqueries_for_sets.end(), expr_queries.begin(), expr_queries.end()); - subqueries_for_sets.insert(subqueries_for_sets.end(), where_expr_queries.begin(), where_expr_queries.end()); + + auto where_expr = ttl_descr.buildWhereExpression(context); + if (where_expr.sets) + { + auto where_expr_queries = where_expr.sets->getSubqueries(); + subqueries_for_sets.insert(subqueries_for_sets.end(), where_expr_queries.begin(), where_expr_queries.end()); + } return {expr.expression, where_expr.expression}; } diff --git a/src/Processors/Transforms/TTLTransform.cpp b/src/Processors/Transforms/TTLTransform.cpp index 69e2e6e5fc0..69b7d80c563 100644 --- a/src/Processors/Transforms/TTLTransform.cpp +++ b/src/Processors/Transforms/TTLTransform.cpp @@ -19,13 +19,15 @@ namespace DB static TTLExpressions getExpressions(const TTLDescription & ttl_descr, PreparedSets::Subqueries & subqueries_for_sets, const ContextPtr & context) { auto expr = ttl_descr.buildExpression(context); - auto where_expr = ttl_descr.buildWhereExpression(context); - auto expr_queries = expr.sets->getSubqueries(); - auto where_expr_queries = expr.sets->getSubqueries(); - subqueries_for_sets.insert(subqueries_for_sets.end(), expr_queries.begin(), expr_queries.end()); - subqueries_for_sets.insert(subqueries_for_sets.end(), where_expr_queries.begin(), where_expr_queries.end()); + + auto where_expr = ttl_descr.buildWhereExpression(context); + if (where_expr.sets) + { + auto where_expr_queries = where_expr.sets->getSubqueries(); + subqueries_for_sets.insert(subqueries_for_sets.end(), where_expr_queries.begin(), where_expr_queries.end()); + } return {expr.expression, where_expr.expression}; } From 0015ec28f9f70548c31e220f2dd826e4ac21f007 Mon Sep 17 00:00:00 2001 From: Nikolai Kochetov Date: Tue, 5 Dec 2023 12:45:25 
+0000 Subject: [PATCH 0042/1081] Fixing test. --- src/Storages/TTLDescription.cpp | 22 +++++++++++++++++++--- 1 file changed, 19 insertions(+), 3 deletions(-) diff --git a/src/Storages/TTLDescription.cpp b/src/Storages/TTLDescription.cpp index e32ff11860b..bfd3afc30d8 100644 --- a/src/Storages/TTLDescription.cpp +++ b/src/Storages/TTLDescription.cpp @@ -18,6 +18,7 @@ #include #include #include +#include namespace DB @@ -172,11 +173,26 @@ TTLDescription & TTLDescription::operator=(const TTLDescription & other) static ExpressionAndSets buildExpressionAndSets(ASTPtr & ast, const NamesAndTypesList & columns, const ContextPtr & context) { ExpressionAndSets result; + auto ttl_string = queryToString(ast); auto syntax_analyzer_result = TreeRewriter(context).analyze(ast, columns); ExpressionAnalyzer analyzer(ast, syntax_analyzer_result, context); - result.expression = analyzer.getActions(false); + auto dag = analyzer.getActionsDAG(false); + + const auto * col = &dag->findInOutputs(ast->getColumnName()); + // std::cerr << "buildExpressionAndSets " << ttl_string << std::endl; + if (col->result_name != ttl_string) + col = &dag->addAlias(*col, ttl_string); + + dag->getOutputs() = {col}; + dag->removeUnusedActions(); + + result.expression = std::make_shared(dag, ExpressionActionsSettings::fromContext(context)); result.sets = analyzer.getPreparedSets(); + // std::cerr << "--------- buildExpressionAndSets\n"; + // std::cerr << result.expression->dumpActions() << std::endl; + // std::cerr << result.sets->getSubqueries().size() << std::endl; + return result; } @@ -218,7 +234,7 @@ TTLDescription TTLDescription::getTTLFromAST( // auto syntax_analyzer_result = TreeRewriter(context).analyze(ttl_ast, columns.getAllPhysical()); // result.expression = ExpressionAnalyzer(ttl_ast, syntax_analyzer_result, context).getActions(false); - result.result_column = ttl_ast->getColumnName(); + result.result_column = expression->getSampleBlock().safeGetByPosition(0).name; ExpressionActionsPtr where_expression; @@ -244,7 +260,7 @@ TTLDescription TTLDescription::getTTLFromAST( // result.where_expression = ExpressionAnalyzer(where_expr_ast, where_syntax_result, context).getActions(false); result.where_expression_columns = where_expression->getRequiredColumnsWithTypes(); - result.where_result_column = where_expr_ast->getColumnName(); + result.where_result_column = where_expression->getSampleBlock().safeGetByPosition(0).name; } } else if (ttl_element->mode == TTLMode::GROUP_BY) From 43a23898e0ddb71fe810dafd850cef911dace902 Mon Sep 17 00:00:00 2001 From: Nikolai Kochetov Date: Tue, 5 Dec 2023 14:20:07 +0000 Subject: [PATCH 0043/1081] Updating the tests. 
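The expected-output changes below appear to follow from the previous commit: `buildExpressionAndSets` now aliases the TTL expression with its formatted text and takes `result_column` from the expression's sample block, so TTL expressions are reported in pretty-printed form (`dt + toIntervalDay(1)`) instead of the internal function spelling (`plus(dt, toIntervalDay(1))`). A sketch of the recompression TTL involved is given here; it is reconstructed from `01465_ttl_recompression.reference` rather than quoted from the test, so the ORDER BY / partitioning and the exact DDL are assumptions.

```sql
-- Reconstructed from 01465_ttl_recompression.reference; not the test's literal DDL.
CREATE TABLE recompression_table
(
    dt DateTime,
    key UInt64
)
ENGINE = MergeTree
ORDER BY key
TTL dt + INTERVAL 1 DAY RECOMPRESS CODEC(ZSTD(12));

-- Expected output strings in the test change accordingly:
--   ['plus(dt, toIntervalDay(1))']  ->  ['dt + toIntervalDay(1)']
```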
--- .../0_stateless/01465_ttl_recompression.reference | 6 +++--- .../queries/0_stateless/02932_set_ttl_where.reference | 3 +++ tests/queries/0_stateless/02932_set_ttl_where.sql | 10 +--------- 3 files changed, 7 insertions(+), 12 deletions(-) diff --git a/tests/queries/0_stateless/01465_ttl_recompression.reference b/tests/queries/0_stateless/01465_ttl_recompression.reference index 108df565669..90661a5dc78 100644 --- a/tests/queries/0_stateless/01465_ttl_recompression.reference +++ b/tests/queries/0_stateless/01465_ttl_recompression.reference @@ -13,9 +13,9 @@ CREATE TABLE default.recompression_table\n(\n `dt` DateTime,\n `key` UInt6 1_1_1 LZ4 2_2_2 ZSTD(12) 3_3_3 ZSTD(12) -1_1_1 ['plus(dt, toIntervalDay(1))'] -2_2_2 ['plus(dt, toIntervalDay(1))'] -3_3_3 ['plus(dt, toIntervalDay(1))'] +1_1_1 ['dt + toIntervalDay(1)'] +2_2_2 ['dt + toIntervalDay(1)'] +3_3_3 ['dt + toIntervalDay(1)'] 1_1_1 LZ4 2_2_2 LZ4 3_3_3 LZ4 diff --git a/tests/queries/0_stateless/02932_set_ttl_where.reference b/tests/queries/0_stateless/02932_set_ttl_where.reference index e69de29bb2d..bb0b1cf658d 100644 --- a/tests/queries/0_stateless/02932_set_ttl_where.reference +++ b/tests/queries/0_stateless/02932_set_ttl_where.reference @@ -0,0 +1,3 @@ +0 +0 +0 diff --git a/tests/queries/0_stateless/02932_set_ttl_where.sql b/tests/queries/0_stateless/02932_set_ttl_where.sql index 85fddf613e8..bf2b317c4bf 100644 --- a/tests/queries/0_stateless/02932_set_ttl_where.sql +++ b/tests/queries/0_stateless/02932_set_ttl_where.sql @@ -1,18 +1,10 @@ -create or replace table temp ( - a UInt32 -) -engine = MergeTree -order by a; - -insert into temp select number from system.numbers limit 100_000; - create or replace table t_temp ( a UInt32, timestamp DateTime ) engine = MergeTree order by a -TTL timestamp + INTERVAL 2 SECOND WHERE a in (select a from temp); +TTL timestamp + INTERVAL 2 SECOND WHERE a in (select number from system.numbers limit 100_000); select sleep(1); insert into t_temp select rand(), now() from system.numbers limit 1_000_000; From 7dc7062dadd5ddf3bed3dea4364cabfa97bcd61a Mon Sep 17 00:00:00 2001 From: Nikolai Kochetov Date: Wed, 6 Dec 2023 12:53:14 +0000 Subject: [PATCH 0044/1081] Fixing test. 
--- src/Interpreters/PreparedSets.cpp | 3 ++- src/Interpreters/Set.h | 1 + 2 files changed, 3 insertions(+), 1 deletion(-) diff --git a/src/Interpreters/PreparedSets.cpp b/src/Interpreters/PreparedSets.cpp index ea8d9a62b8b..9f646825d9f 100644 --- a/src/Interpreters/PreparedSets.cpp +++ b/src/Interpreters/PreparedSets.cpp @@ -189,7 +189,8 @@ SetPtr FutureSetFromSubquery::buildOrderedSetInplace(const ContextPtr & context) } } - set_and_key->set->fillSetElements(); + if (!set_and_key->set->hasSetElements()) + set_and_key->set->fillSetElements(); return buildSetInplace(context); } diff --git a/src/Interpreters/Set.h b/src/Interpreters/Set.h index 7136b090c42..7e8e0f2371b 100644 --- a/src/Interpreters/Set.h +++ b/src/Interpreters/Set.h @@ -77,6 +77,7 @@ public: const DataTypes & getElementsTypes() const { return set_elements_types; } bool hasExplicitSetElements() const { return fill_set_elements || (!set_elements.empty() && set_elements.front()->size() == data.getTotalRowCount()); } + bool hasSetElements() const { return !set_elements.empty(); } Columns getSetElements() const { checkIsCreated(); return { set_elements.begin(), set_elements.end() }; } void checkColumnsNumber(size_t num_key_columns) const; From 23bde28ac4fc18e296daf6b04283ab50ee58d025 Mon Sep 17 00:00:00 2001 From: kssenii Date: Fri, 8 Dec 2023 19:11:47 +0100 Subject: [PATCH 0045/1081] Fxi --- src/Storages/MergeTree/IMergeTreeDataPart.cpp | 6 ++---- src/Storages/MergeTree/IMergeTreeDataPart.h | 2 +- src/Storages/MergeTree/MutateTask.cpp | 6 ++++-- 3 files changed, 7 insertions(+), 7 deletions(-) diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index 52310802c9d..5418bcd83f3 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -677,7 +677,7 @@ void IMergeTreeDataPart::loadColumnsChecksumsIndexes(bool require_columns_checks if (!parent_part) { loadTTLInfos(); - has_broken_projections = !loadProjections(require_columns_checksums, check_consistency, false /* if_not_loaded */); + loadProjections(require_columns_checksums, check_consistency, has_broken_projections, false /* if_not_loaded */); } if (check_consistency && !has_broken_projections) @@ -742,10 +742,9 @@ void IMergeTreeDataPart::addProjectionPart( projection_parts[projection_name] = std::move(projection_part); } -bool IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool check_consistency, bool if_not_loaded) +void IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool check_consistency, bool & has_broken_projection, bool if_not_loaded) { auto metadata_snapshot = storage.getInMemoryMetadataPtr(); - bool has_broken_projection = false; for (const auto & projection : metadata_snapshot->projections) { auto path = projection.name + ".proj"; @@ -782,7 +781,6 @@ bool IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool ch } } } - return has_broken_projection; } void IMergeTreeDataPart::loadIndexGranularity() diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.h b/src/Storages/MergeTree/IMergeTreeDataPart.h index 050bd76121c..9812529086b 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.h +++ b/src/Storages/MergeTree/IMergeTreeDataPart.h @@ -434,7 +434,7 @@ public: bool hasBrokenProjection(const String & projection_name) const; /// Return true, if all projections were loaded successfully and none was marked as broken. 
- bool loadProjections(bool require_columns_checksums, bool check_consistency, bool if_not_loaded = false); + void loadProjections(bool require_columns_checksums, bool check_consistency, bool & has_broken_projection, bool if_not_loaded = false); void setBrokenReason(const String & message, int code) const; diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index 93b241deae7..2b0cf60a7f1 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -870,7 +870,8 @@ void finalizeMutatedPart( new_data_part->modification_time = time(nullptr); /// Load rest projections which are hardlinked - new_data_part->loadProjections(false, false, true /* if_not_loaded */); + bool noop; + new_data_part->loadProjections(false, false, noop, true /* if_not_loaded */); /// All information about sizes is stored in checksums. /// It doesn't make sense to touch filesystem for sizes. @@ -1570,8 +1571,9 @@ private: void finalize() { + bool noop; ctx->new_data_part->minmax_idx = std::move(ctx->minmax_idx); - ctx->new_data_part->loadProjections(false, false, true /* if_not_loaded */); + ctx->new_data_part->loadProjections(false, false, noop, true /* if_not_loaded */); ctx->mutating_executor.reset(); ctx->mutating_pipeline.reset(); From c8c4db5984bf9101478e0d1f33c3432c257ea7a0 Mon Sep 17 00:00:00 2001 From: kssenii Date: Mon, 11 Dec 2023 13:24:31 +0100 Subject: [PATCH 0046/1081] Fxi test --- src/Storages/MergeTree/IMergeTreeDataPart.cpp | 7 +++++++ .../queries/0_stateless/02916_broken_projection.reference | 7 ++++--- tests/queries/0_stateless/02916_broken_projection.sh | 4 +++- 3 files changed, 14 insertions(+), 4 deletions(-) diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index 5418bcd83f3..7af49edf788 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -780,6 +780,13 @@ void IMergeTreeDataPart::loadProjections(bool require_columns_checksums, bool ch addProjectionPart(projection.name, std::move(part)); } } + else if (checksums.has(path)) + { + auto part = getProjectionPartBuilder(projection.name).withPartFormatFromDisk().build(); + part->setBrokenReason("Projection directory " + path + " does not exist while loading projections", ErrorCodes::NO_FILE_IN_DATA_PART); + addProjectionPart(projection.name, std::move(part)); + has_broken_projection = true; + } } } diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index b7764a6434e..358304de74a 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -406,7 +406,7 @@ SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 0 -broke all data of part 'proj' (parent part: all_2_2_0) +broke all data of part 'proj' (parent part: all_1_1_0) system.parts all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] @@ -421,13 +421,13 @@ SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 0 broken projections info -all_2_2_0 proj FILE_DOESNT_EXIST +all_1_1_0 proj FILE_DOESNT_EXIST BACKUP_CREATED RESTORED system.parts all_0_0_0 1 ['proj','proj_2'] all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj_2'] +all_2_2_0 1 ['proj','proj_2'] all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 @@ -442,3 +442,4 @@ SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check 
table 0 broken projections info +all_1_1_0 proj NO_FILE_IN_DATA_PART diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 0910ba177fb..eb68f8621a2 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -410,6 +410,8 @@ function test2() check test2 } +CLICKHOUSE_DATABASE="default" +CLICKHOUSE_TEST_UNIQUE_NAME="test123456" function test3() { create_table test3 test 1 @@ -473,7 +475,7 @@ function test3() check test - break_projection test proj all_2_2_0 part + break_projection test proj all_1_1_0 part check test proj FILE_DOESNT_EXIST From cd41802d7e5b056e0114c8ad7523f00828ad5940 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Mon, 11 Dec 2023 17:37:44 +0100 Subject: [PATCH 0047/1081] Update 02916_broken_projection.sh --- tests/queries/0_stateless/02916_broken_projection.sh | 2 -- 1 file changed, 2 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index eb68f8621a2..a52570f3d52 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -410,8 +410,6 @@ function test2() check test2 } -CLICKHOUSE_DATABASE="default" -CLICKHOUSE_TEST_UNIQUE_NAME="test123456" function test3() { create_table test3 test 1 From 457032d2998a085fb9c10c0b9d536e79dbcc5dab Mon Sep 17 00:00:00 2001 From: kssenii Date: Mon, 11 Dec 2023 20:40:25 +0100 Subject: [PATCH 0048/1081] Disable fault injection because it breaks .reference --- tests/queries/0_stateless/02916_broken_projection.sh | 10 ++++++++-- 1 file changed, 8 insertions(+), 2 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index a52570f3d52..2049610e45b 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -52,7 +52,7 @@ function insert() offset=$2 size=$3 echo 'insert new part' - $CLICKHOUSE_CLIENT -q "INSERT INTO $table SELECT number, number, number, number, number%2 FROM numbers($offset, $size);" + $CLICKHOUSE_CLIENT -q "INSERT INTO $table SELECT number, number, number, number, number%2 FROM numbers($offset, $size) SETTINGS insert_keeper_fault_injection_probability;" } function break_projection() @@ -431,11 +431,12 @@ function test3() broken_projections_info test ${CLICKHOUSE_CLIENT} -nm --query " - backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}') settings check_projection_parts=false; + backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}') settings check_projection_parts=false, backup_restore_keeper_fault_injection_probability=0.0; " | grep -o "BACKUP_CREATED" ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " drop table test sync; + set backup_restore_keeper_fault_injection_probability=0.0; restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}'); " | grep -o "RESTORED" @@ -451,6 +452,7 @@ function test3() ${CLICKHOUSE_CLIENT} -nm --query " set send_logs_level='fatal'; + set backup_restore_keeper_fault_injection_probability=0.0; backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2') " 2>&1 | grep -o "FILE_DOESNT_EXIST" @@ -462,12 +464,14 @@ function test3() ${CLICKHOUSE_CLIENT} -nm --query " set 
send_logs_level='fatal'; + set backup_restore_keeper_fault_injection_probability=0.0; backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3') " | grep -o "BACKUP_CREATED" ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " drop table test sync; set send_logs_level='fatal'; + set backup_restore_keeper_fault_injection_probability=0.0; restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3'); " | grep -o "RESTORED" @@ -481,6 +485,7 @@ function test3() ${CLICKHOUSE_CLIENT} -nm --query " set send_logs_level='fatal'; + set backup_restore_keeper_fault_injection_probability=0.0; backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_4') settings check_projection_parts=false, allow_backup_broken_projections=true; " | grep -o "BACKUP_CREATED" @@ -488,6 +493,7 @@ function test3() ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " drop table test sync; set send_logs_level='fatal'; + set backup_restore_keeper_fault_injection_probability=0.0; restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_4'); " | grep -o "RESTORED" From 8ef2638cfce90031213bbbd595a50d584406a916 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Tue, 12 Dec 2023 14:22:14 +0100 Subject: [PATCH 0049/1081] Update 02916_broken_projection.sh --- tests/queries/0_stateless/02916_broken_projection.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 2049610e45b..0418759eb26 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -52,7 +52,7 @@ function insert() offset=$2 size=$3 echo 'insert new part' - $CLICKHOUSE_CLIENT -q "INSERT INTO $table SELECT number, number, number, number, number%2 FROM numbers($offset, $size) SETTINGS insert_keeper_fault_injection_probability;" + $CLICKHOUSE_CLIENT -q "INSERT INTO $table SELECT number, number, number, number, number%2 FROM numbers($offset, $size) SETTINGS insert_keeper_fault_injection_probability=0.0;" } function break_projection() From d81edb4adf65c8c3724ec27fc83b65d5d1b3ebad Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Wed, 13 Dec 2023 12:29:28 +0100 Subject: [PATCH 0050/1081] Update 02916_broken_projection.sh --- tests/queries/0_stateless/02916_broken_projection.sh | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 0418759eb26..07495c45214 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -431,7 +431,8 @@ function test3() broken_projections_info test ${CLICKHOUSE_CLIENT} -nm --query " - backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}') settings check_projection_parts=false, backup_restore_keeper_fault_injection_probability=0.0; + set backup_restore_keeper_fault_injection_probability=0.0; + backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}') settings check_projection_parts=false; " | grep -o "BACKUP_CREATED" ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " From 79432255df02f696962858347c2207dbdbf2b69f Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova 
<54203879+kssenii@users.noreply.github.com> Date: Mon, 18 Dec 2023 12:45:24 +0100 Subject: [PATCH 0051/1081] Update 02916_broken_projection.sh --- tests/queries/0_stateless/02916_broken_projection.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 07495c45214..55e613b8f3a 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -1,5 +1,5 @@ #!/usr/bin/env bash -# Tags: long, no-random-merge-tree-settings +# Tags: long, no-random-merge-tree-settings, no-random-settings # shellcheck disable=SC2046 CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) From 59153e865d4ffeda3c67cbdd945e14fdc860e446 Mon Sep 17 00:00:00 2001 From: Duc Canh Le Date: Tue, 19 Dec 2023 09:53:04 +0000 Subject: [PATCH 0052/1081] materialize column not to override past values Signed-off-by: Duc Canh Le --- src/Storages/MergeTree/MutateTask.cpp | 23 +++++++-- .../0_stateless/02008_materialize_column.sql | 1 + ..._column_not_override_past_values.reference | 29 +++++++++++ ...ialize_column_not_override_past_values.sql | 49 +++++++++++++++++++ 4 files changed, 97 insertions(+), 5 deletions(-) create mode 100644 tests/queries/0_stateless/02946_materialize_column_not_override_past_values.reference create mode 100644 tests/queries/0_stateless/02946_materialize_column_not_override_past_values.sql diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index 827749aa094..a04d9cdb886 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -65,6 +65,7 @@ static void splitAndModifyMutationCommands( Poco::Logger * log) { auto part_columns = part->getColumnsDescription(); + const auto & table_columns = metadata_snapshot->getColumns(); if (!isWidePart(part) || !isFullPartStorage(part->getDataPartStorage())) { @@ -73,9 +74,16 @@ static void splitAndModifyMutationCommands( for (const auto & command : commands) { + if (command.type == MutationCommand::Type::MATERIALIZE_COLUMN) + { + /// For ordinary column with default expression, materialize column should not override past values + /// So we only mutated column if `command.column_name` is a materialized column or if the part does not have physical column file + auto column_ordinary = table_columns.getOrdinary().tryGetByName(command.column_name); + if (!column_ordinary || !part->tryGetColumn(command.column_name) || !part->hasColumnFiles(*column_ordinary)) + mutated_columns.emplace(command.column_name); + } if (command.type == MutationCommand::Type::MATERIALIZE_INDEX || command.type == MutationCommand::Type::MATERIALIZE_STATISTIC - || command.type == MutationCommand::Type::MATERIALIZE_COLUMN || command.type == MutationCommand::Type::MATERIALIZE_PROJECTION || command.type == MutationCommand::Type::MATERIALIZE_TTL || command.type == MutationCommand::Type::DELETE @@ -85,8 +93,6 @@ static void splitAndModifyMutationCommands( for (const auto & [column_name, expr] : command.column_to_update_expression) mutated_columns.emplace(column_name); - if (command.type == MutationCommand::Type::MATERIALIZE_COLUMN) - mutated_columns.emplace(command.column_name); } else if (command.type == MutationCommand::Type::DROP_INDEX || command.type == MutationCommand::Type::DROP_PROJECTION @@ -196,8 +202,15 @@ static void splitAndModifyMutationCommands( { for (const auto & command : commands) { - if (command.type == 
MutationCommand::Type::MATERIALIZE_INDEX - || command.type == MutationCommand::Type::MATERIALIZE_COLUMN + if (command.type == MutationCommand::Type::MATERIALIZE_COLUMN) + { + /// For ordinary column with default expression, materialize column should not override past values + /// So we only mutated column if `command.column_name` is a materialized column or if the part does not have physical column file + auto column_ordinary = table_columns.getOrdinary().tryGetByName(command.column_name); + if (!column_ordinary || !part->tryGetColumn(command.column_name) || !part->hasColumnFiles(*column_ordinary)) + for_interpreter.push_back(command); + } + else if (command.type == MutationCommand::Type::MATERIALIZE_INDEX || command.type == MutationCommand::Type::MATERIALIZE_STATISTIC || command.type == MutationCommand::Type::MATERIALIZE_PROJECTION || command.type == MutationCommand::Type::MATERIALIZE_TTL diff --git a/tests/queries/0_stateless/02008_materialize_column.sql b/tests/queries/0_stateless/02008_materialize_column.sql index a78920d2525..cc7d3096402 100644 --- a/tests/queries/0_stateless/02008_materialize_column.sql +++ b/tests/queries/0_stateless/02008_materialize_column.sql @@ -17,6 +17,7 @@ ALTER TABLE tmp MATERIALIZE COLUMN s; ALTER TABLE tmp MODIFY COLUMN s String DEFAULT toString(x+2); SELECT arraySort(groupArray(x)), groupArray(s) FROM tmp; +ALTER TABLE tmp CLEAR COLUMN s; -- Need to clear because MATERIALIZE COLUMN won't override past values; ALTER TABLE tmp MATERIALIZE COLUMN s; ALTER TABLE tmp MODIFY COLUMN s String DEFAULT toString(x+3); SELECT arraySort(groupArray(x)), groupArray(s) FROM tmp; diff --git a/tests/queries/0_stateless/02946_materialize_column_not_override_past_values.reference b/tests/queries/0_stateless/02946_materialize_column_not_override_past_values.reference new file mode 100644 index 00000000000..6b0d88bd09b --- /dev/null +++ b/tests/queries/0_stateless/02946_materialize_column_not_override_past_values.reference @@ -0,0 +1,29 @@ +--Origin-- +1 2 +2 54321 +--After materialize-- +1 2 +2 54321 +--Origin-- +1 2 +2 54321 +--After materialize-- +1 2 +2 54321 +--Origin-- +1 2 +2 \N +3 54321 +--After materialize-- +1 2 +2 \N +3 54321 +--Origin-- +1 2 +2 54321 +--After rename-- +1 2 +2 54321 +--After materialize-- +1 2 +2 54321 diff --git a/tests/queries/0_stateless/02946_materialize_column_not_override_past_values.sql b/tests/queries/0_stateless/02946_materialize_column_not_override_past_values.sql new file mode 100644 index 00000000000..1815661e097 --- /dev/null +++ b/tests/queries/0_stateless/02946_materialize_column_not_override_past_values.sql @@ -0,0 +1,49 @@ + +SET mutations_sync = 2; +-- Compact parts +CREATE TABLE test (id Int64, foo Int64 default 54321) ENGINE MergeTree ORDER BY id; +INSERT INTO test ( id, foo ) values ( 1, 2 ); +INSERT INTO test ( id ) values ( 2 ); +SELECT '--Origin--'; +SELECT * FROM test ORDER BY id; +ALTER TABLE test MATERIALIZE COLUMN foo; +SELECT '--After materialize--'; +SELECT * FROM test ORDER BY id; +DROP TABLE test; + +-- Wide parts +CREATE TABLE test (id Int64, foo Nullable(Int64) default 54321) ENGINE MergeTree ORDER BY id SETTINGS min_bytes_for_wide_part = 1; +INSERT INTO test ( id, foo ) values ( 1, 2 ); +INSERT INTO test ( id ) values ( 2 ); +SELECT '--Origin--'; +SELECT * FROM test ORDER BY id; +ALTER TABLE test MATERIALIZE COLUMN foo; +SELECT '--After materialize--'; +SELECT * FROM test ORDER BY id; +DROP TABLE test; + +-- Nullable column != physically absent +CREATE TABLE test (id Int64, foo Nullable(Int64) default 54321) ENGINE 
MergeTree ORDER BY id SETTINGS min_bytes_for_wide_part = 1; +INSERT INTO test ( id, foo ) values ( 1, 2 ); +INSERT INTO test ( id, foo ) values ( 2, NULL ); +INSERT INTO test ( id ) values ( 3 ); +SELECT '--Origin--'; +SELECT * FROM test ORDER BY id; +ALTER TABLE test MATERIALIZE COLUMN foo; +SELECT '--After materialize--'; +SELECT * FROM test ORDER BY id; +DROP TABLE test; + +-- Parts with renamed column +CREATE TABLE test (id Int64, foo Int64 default 54321) ENGINE MergeTree ORDER BY id; +INSERT INTO test ( id, foo ) values ( 1, 2 ); +INSERT INTO test ( id ) values ( 2 ); +SELECT '--Origin--'; +SELECT * FROM test ORDER BY id; +ALTER TABLE test RENAME COLUMN foo TO bar; +SELECT '--After rename--'; +SELECT * FROM test ORDER BY id; +ALTER TABLE test MATERIALIZE COLUMN bar; +SELECT '--After materialize--'; +SELECT * FROM test ORDER BY id; +DROP TABLE test; \ No newline at end of file From a924b01a023512727d6a36fc12052f67438ba199 Mon Sep 17 00:00:00 2001 From: Justin de Guzman Date: Tue, 19 Dec 2023 02:05:32 -0800 Subject: [PATCH 0053/1081] [Docs] Clarify to use query level settings in ClickHouse Cloud --- docs/en/operations/query-cache.md | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/docs/en/operations/query-cache.md b/docs/en/operations/query-cache.md index def0f48b968..2f05599e666 100644 --- a/docs/en/operations/query-cache.md +++ b/docs/en/operations/query-cache.md @@ -31,6 +31,10 @@ This reduces maintenance effort and avoids redundancy. ## Configuration Settings and Usage +:::note +In ClickHouse Cloud, you must use [query level settings](/en/operations/settings/query-level) to edit query cache settings. Editing [config level settings](/en/operations/configuration-files) is currently not supported. +::: + Setting [use_query_cache](settings/settings.md#use-query-cache) can be used to control whether a specific query or all queries of the current session should utilize the query cache. 
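To make the Cloud note above concrete, here is a hedged illustration of the query-level form it refers to; `query_cache_ttl` is a standard query-cache setting used for illustration and is not part of this patch.

```sql
-- Query-level (per-statement) configuration of the query cache:
SELECT count()
FROM numbers(1000000)
SETTINGS use_query_cache = true, query_cache_ttl = 300;
```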
For example, the first execution of query From 319ae440b6ba09b1dc21b355fab22a99d073592c Mon Sep 17 00:00:00 2001 From: avogar Date: Tue, 19 Dec 2023 16:43:30 +0000 Subject: [PATCH 0054/1081] Implement Variant data type --- docs/en/operations/settings/settings.md | 52 + docs/en/sql-reference/data-types/variant.md | 217 ++ .../functions/other-functions.md | 36 + src/Columns/ColumnNullable.cpp | 22 +- src/Columns/ColumnNullable.h | 1 + src/Columns/ColumnVariant.cpp | 1360 +++++++++ src/Columns/ColumnVariant.h | 306 ++ src/Columns/IColumn.cpp | 6 + src/Columns/IColumn.h | 14 + src/Columns/MaskOperations.cpp | 6 +- src/Columns/MaskOperations.h | 2 +- src/Columns/tests/gtest_column_variant.cpp | 688 +++++ src/Core/Settings.h | 2 + src/Core/TypeId.h | 1 + src/DataTypes/DataTypeFactory.cpp | 1 + src/DataTypes/DataTypeFactory.h | 1 + src/DataTypes/DataTypeNullable.cpp | 28 + src/DataTypes/DataTypeNullable.h | 3 + src/DataTypes/DataTypeTuple.cpp | 9 +- src/DataTypes/DataTypeVariant.cpp | 197 ++ src/DataTypes/DataTypeVariant.h | 64 + src/DataTypes/EnumValues.cpp | 21 + src/DataTypes/EnumValues.h | 8 +- src/DataTypes/IDataType.cpp | 23 +- src/DataTypes/IDataType.h | 3 + .../Serializations/ISerialization.cpp | 61 +- src/DataTypes/Serializations/ISerialization.h | 13 + .../Serializations/SerializationArray.cpp | 138 +- .../Serializations/SerializationArray.h | 3 + .../Serializations/SerializationBool.cpp | 179 +- .../Serializations/SerializationBool.h | 8 +- .../SerializationCustomSimpleText.cpp | 56 + .../SerializationCustomSimpleText.h | 6 + .../Serializations/SerializationDate.cpp | 46 + .../Serializations/SerializationDate.h | 5 + .../Serializations/SerializationDate32.cpp | 45 + .../Serializations/SerializationDate32.h | 5 + .../Serializations/SerializationDateTime.cpp | 157 +- .../Serializations/SerializationDateTime.h | 5 + .../SerializationDateTime64.cpp | 112 + .../Serializations/SerializationDateTime64.h | 6 + .../Serializations/SerializationDecimal.cpp | 46 +- .../Serializations/SerializationDecimal.h | 6 +- .../Serializations/SerializationEnum.cpp | 97 + .../Serializations/SerializationEnum.h | 13 + .../SerializationFixedString.cpp | 56 + .../Serializations/SerializationFixedString.h | 6 + .../SerializationIPv4andIPv6.cpp | 188 ++ .../Serializations/SerializationIPv4andIPv6.h | 129 +- .../SerializationLowCardinality.cpp | 47 +- .../SerializationLowCardinality.h | 12 + .../Serializations/SerializationMap.cpp | 108 +- .../Serializations/SerializationMap.h | 7 +- .../Serializations/SerializationNamed.cpp | 1 + .../Serializations/SerializationNothing.h | 1 + .../Serializations/SerializationNullable.cpp | 532 +++- .../Serializations/SerializationNullable.h | 53 +- .../Serializations/SerializationNumber.cpp | 80 +- .../Serializations/SerializationNumber.h | 3 + .../Serializations/SerializationString.cpp | 101 +- .../Serializations/SerializationString.h | 5 + .../Serializations/SerializationTuple.cpp | 318 ++- .../Serializations/SerializationTuple.h | 12 + .../Serializations/SerializationUUID.cpp | 41 +- .../Serializations/SerializationUUID.h | 6 +- .../Serializations/SerializationVariant.cpp | 828 ++++++ .../Serializations/SerializationVariant.h | 116 + .../SerializationVariantElement.cpp | 241 ++ .../SerializationVariantElement.h | 87 + .../Serializations/SerializationWrapper.cpp | 25 + .../Serializations/SerializationWrapper.h | 5 + .../Serializations/SimpleTextSerialization.h | 38 + src/DataTypes/Utils.cpp | 1 + src/Databases/DatabaseReplicated.cpp | 1 + src/Formats/EscapingRuleUtils.cpp | 10 
+- src/Formats/JSONUtils.cpp | 4 +- src/Formats/SchemaInferenceUtils.cpp | 2 +- src/Functions/FunctionsConversion.h | 262 +- src/Functions/if.cpp | 50 +- src/Functions/isNotNull.cpp | 13 + src/Functions/isNull.cpp | 13 + src/Functions/multiIf.cpp | 10 + src/Functions/variantElement.cpp | 238 ++ src/IO/ReadHelpers.cpp | 298 +- src/IO/ReadHelpers.h | 198 +- src/IO/readDecimalText.h | 20 + src/Interpreters/InterpreterCreateQuery.cpp | 14 + src/Interpreters/InterpreterInsertQuery.cpp | 2 +- src/Interpreters/inplaceBlockConversions.cpp | 35 +- .../parseColumnsListForTableFunction.cpp | 11 + .../parseColumnsListForTableFunction.h | 2 + src/Parsers/ExpressionElementParsers.cpp | 2 +- .../Formats/Impl/CSVRowInputFormat.cpp | 2 +- .../Formats/Impl/MySQLDumpRowInputFormat.cpp | 2 +- .../Formats/Impl/TSKVRowInputFormat.cpp | 2 +- .../Impl/TabSeparatedRowInputFormat.cpp | 4 +- .../Formats/Impl/ValuesBlockInputFormat.cpp | 2 +- ...940_variant_text_deserialization.reference | 516 ++++ .../02940_variant_text_deserialization.sql | 266 ++ .../02941_variant_type_1.reference | 2472 +++++++++++++++++ .../0_stateless/02941_variant_type_1.sh | 124 + .../02941_variant_type_2.reference | 51 + .../0_stateless/02941_variant_type_2.sh | 71 + .../02941_variant_type_3.reference | 51 + .../0_stateless/02941_variant_type_3.sh | 71 + .../02941_variant_type_4.reference | 56 + .../0_stateless/02941_variant_type_4.sh | 66 + .../0_stateless/02942_variant_cast.reference | 25 + .../0_stateless/02942_variant_cast.sql | 23 + .../02943_variant_element.reference | 44 + .../0_stateless/02943_variant_element.sql | 16 + ...44_variant_as_if_multi_if_result.reference | 96 + .../02944_variant_as_if_multi_if_result.sql | 64 + 113 files changed, 11750 insertions(+), 584 deletions(-) create mode 100644 docs/en/sql-reference/data-types/variant.md create mode 100644 src/Columns/ColumnVariant.cpp create mode 100644 src/Columns/ColumnVariant.h create mode 100644 src/Columns/tests/gtest_column_variant.cpp create mode 100644 src/DataTypes/DataTypeVariant.cpp create mode 100644 src/DataTypes/DataTypeVariant.h create mode 100644 src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp create mode 100644 src/DataTypes/Serializations/SerializationVariant.cpp create mode 100644 src/DataTypes/Serializations/SerializationVariant.h create mode 100644 src/DataTypes/Serializations/SerializationVariantElement.cpp create mode 100644 src/DataTypes/Serializations/SerializationVariantElement.h create mode 100644 src/Functions/variantElement.cpp create mode 100644 tests/queries/0_stateless/02940_variant_text_deserialization.reference create mode 100644 tests/queries/0_stateless/02940_variant_text_deserialization.sql create mode 100644 tests/queries/0_stateless/02941_variant_type_1.reference create mode 100755 tests/queries/0_stateless/02941_variant_type_1.sh create mode 100644 tests/queries/0_stateless/02941_variant_type_2.reference create mode 100755 tests/queries/0_stateless/02941_variant_type_2.sh create mode 100644 tests/queries/0_stateless/02941_variant_type_3.reference create mode 100755 tests/queries/0_stateless/02941_variant_type_3.sh create mode 100644 tests/queries/0_stateless/02941_variant_type_4.reference create mode 100755 tests/queries/0_stateless/02941_variant_type_4.sh create mode 100644 tests/queries/0_stateless/02942_variant_cast.reference create mode 100644 tests/queries/0_stateless/02942_variant_cast.sql create mode 100644 tests/queries/0_stateless/02943_variant_element.reference create mode 100644 
tests/queries/0_stateless/02943_variant_element.sql create mode 100644 tests/queries/0_stateless/02944_variant_as_if_multi_if_result.reference create mode 100644 tests/queries/0_stateless/02944_variant_as_if_multi_if_result.sql
diff --git a/docs/en/operations/settings/settings.md b/docs/en/operations/settings/settings.md index dc46a3f0dcd..dbf5bc341cc 100644 --- a/docs/en/operations/settings/settings.md +++ b/docs/en/operations/settings/settings.md @@ -5134,3 +5134,55 @@ When set to `true` than for all s3 requests first two attempts are made with low When set to `false` than all attempts are made with identical timeouts. Default value: `true`.
+
+## allow_experimental_variant_type {#allow_experimental_variant_type}
+
+Allows creation of the experimental [Variant](../../sql-reference/data-types/variant.md) data type.
+
+Default value: `false`.
+
+## use_variant_when_no_common_type_in_if {#use_variant_when_no_common_type_in_if}
+
+Allows using the `Variant` type as the result type for [if](../../sql-reference/functions/conditional-functions.md/#if)/[multiIf](../../sql-reference/functions/conditional-functions.md/#multiif) functions when there is no common type for the argument types.
+
+Example:
+
+```sql
+SET use_variant_when_no_common_type_in_if = 1;
+SELECT toTypeName(if(number % 2, number, range(number))) as variant_type FROM numbers(1);
+SELECT if(number % 2, number, range(number)) as variant FROM numbers(5);
+```
+
+```text
+┌─variant_type───────────────────┐
+│ Variant(Array(UInt64), UInt64) │
+└────────────────────────────────┘
+┌─variant───┐
+│ []        │
+│ 1         │
+│ [0,1]     │
+│ 3         │
+│ [0,1,2,3] │
+└───────────┘
+```
+
+```sql
+SET use_variant_when_no_common_type_in_if = 1;
+SELECT toTypeName(multiIf((number % 4) = 0, 42, (number % 4) = 1, [1, 2, 3], (number % 4) = 2, 'Hello, World!', NULL)) AS variant_type FROM numbers(1);
+SELECT multiIf((number % 4) = 0, 42, (number % 4) = 1, [1, 2, 3], (number % 4) = 2, 'Hello, World!', NULL) AS variant FROM numbers(4);
+```
+
+```text
+┌─variant_type─────────────────────────┐
+│ Variant(Array(UInt8), String, UInt8) │
+└──────────────────────────────────────┘
+
+┌─variant───────┐
+│ 42            │
+│ [1,2,3]       │
+│ Hello, World! │
+│ ᴺᵁᴸᴸ          │
+└───────────────┘
+```
+
+Default value: `false`.
diff --git a/docs/en/sql-reference/data-types/variant.md b/docs/en/sql-reference/data-types/variant.md new file mode 100644 index 00000000000..34966d79079 --- /dev/null +++ b/docs/en/sql-reference/data-types/variant.md @@ -0,0 +1,217 @@
+---
+slug: /en/sql-reference/data-types/variant
+sidebar_position: 55
+sidebar_label: Variant
+---
+
+# Variant(T1, T2, T3, ...)
+
+This type represents a union of other data types. Type `Variant(T1, T2, ..., TN)` means that each row of this type
+has a value of either type `T1` or `T2` or ... or `TN` or none of them (`NULL` value).
+
+The order of nested types doesn't matter: Variant(T1, T2) = Variant(T2, T1).
+Nested types can be arbitrary types except Nullable(...), LowCardinality(Nullable(...)) and Variant(...) types.
+
+:::note
+The Variant data type is an experimental feature. To use it, set `allow_experimental_variant_type = 1`.
+:::
+
+## Creating Variant
+
+Using the `Variant` type in a table column definition:
+
+```sql
+CREATE TABLE test (v Variant(UInt64, String, Array(UInt64))) ENGINE = Memory;
+INSERT INTO test VALUES (NULL), (42), ('Hello, World!'), ([1, 2, 3]);
+SELECT v FROM test;
+```
+
+```text
+┌─v─────────────┐
+│ ᴺᵁᴸᴸ          │
+│ 42            │
+│ Hello, World! │
+│ [1,2,3]       │
+└───────────────┘
+```
+
+Using CAST from ordinary columns:
+
+```sql
+SELECT toTypeName(variant) as type_name, 'Hello, World!'::Variant(UInt64, String, Array(UInt64)) as variant;
+```
+
+```text
+┌─type_name──────────────────────────────┬─variant───────┐
+│ Variant(Array(UInt64), String, UInt64) │ Hello, World! │
+└────────────────────────────────────────┴───────────────┘
+```
+
+Using the functions `if`/`multiIf` when the arguments don't have a common type (the setting `use_variant_when_no_common_type_in_if` must be enabled for this):
+
+```sql
+SET use_variant_when_no_common_type_in_if = 1;
+SELECT if(number % 2, number, range(number)) as variant FROM numbers(5);
+```
+
+```text
+┌─variant───┐
+│ []        │
+│ 1         │
+│ [0,1]     │
+│ 3         │
+│ [0,1,2,3] │
+└───────────┘
+```
+
+```sql
+SET use_variant_when_no_common_type_in_if = 1;
+SELECT multiIf((number % 4) = 0, 42, (number % 4) = 1, [1, 2, 3], (number % 4) = 2, 'Hello, World!', NULL) AS variant FROM numbers(4);
+```
+
+```text
+┌─variant───────┐
+│ 42            │
+│ [1,2,3]       │
+│ Hello, World! │
+│ ᴺᵁᴸᴸ          │
+└───────────────┘
+```
+
+## Reading Variant nested types as subcolumns
+
+The Variant type supports reading a single nested type from a Variant column using the type name as a subcolumn.
+So, if you have a column `variant Variant(T1, T2, T3)`, you can read a subcolumn of type `T2` using the syntax `variant.T2`;
+this subcolumn will have type `Nullable(T2)` if `T2` can be inside `Nullable`, and `T2` otherwise. This subcolumn will
+be the same size as the original `Variant` column and will contain `NULL` values (or empty values if `T2` cannot be inside `Nullable`)
+in all rows in which the original `Variant` column doesn't have type `T2`.
+
+Variant subcolumns can also be read using the function `variantElement(variant_column, type_name)`.
+
+Examples:
+
+```sql
+CREATE TABLE test (v Variant(UInt64, String, Array(UInt64))) ENGINE = Memory;
+INSERT INTO test VALUES (NULL), (42), ('Hello, World!'), ([1, 2, 3]);
+SELECT v, v.String, v.UInt64, v.`Array(UInt64)` FROM test;
+```
+
+```text
+┌─v─────────────┬─v.String──────┬─v.UInt64─┬─v.Array(UInt64)─┐
+│ ᴺᵁᴸᴸ          │ ᴺᵁᴸᴸ          │     ᴺᵁᴸᴸ │ []              │
+│ 42            │ ᴺᵁᴸᴸ          │       42 │ []              │
+│ Hello, World! │ Hello, World! │     ᴺᵁᴸᴸ │ []              │
+│ [1,2,3]       │ ᴺᵁᴸᴸ          │     ᴺᵁᴸᴸ │ [1,2,3]         │
+└───────────────┴───────────────┴──────────┴─────────────────┘
+```
+
+```sql
+SELECT toTypeName(v.String), toTypeName(v.UInt64), toTypeName(v.`Array(UInt64)`) FROM test LIMIT 1;
+```
+
+```text
+┌─toTypeName(v.String)─┬─toTypeName(v.UInt64)─┬─toTypeName(v.Array(UInt64))─┐
+│ Nullable(String)     │ Nullable(UInt64)     │ Array(UInt64)               │
+└──────────────────────┴──────────────────────┴─────────────────────────────┘
+```
+
+```sql
+SELECT v, variantElement(v, 'String'), variantElement(v, 'UInt64'), variantElement(v, 'Array(UInt64)') FROM test;
+```
+
+```text
+┌─v─────────────┬─variantElement(v, 'String')─┬─variantElement(v, 'UInt64')─┬─variantElement(v, 'Array(UInt64)')─┐
+│ ᴺᵁᴸᴸ          │ ᴺᵁᴸᴸ                        │                        ᴺᵁᴸᴸ │ []                                 │
+│ 42            │ ᴺᵁᴸᴸ                        │                          42 │ []                                 │
+│ Hello, World! │ Hello, World!               │                        ᴺᵁᴸᴸ │ []                                 │
+│ [1,2,3]       │ ᴺᵁᴸᴸ                        │                        ᴺᵁᴸᴸ │ [1,2,3]                            │
+└───────────────┴─────────────────────────────┴─────────────────────────────┴────────────────────────────────────┘
+```
+
+## Conversion between a Variant column and other columns
+
+There are 3 possible conversions that can be performed with a `Variant` column.
+
+### Converting an ordinary column to a Variant column
+
+It is possible to convert an ordinary column with type `T` to a `Variant` column containing this type:
+
+```sql
+SELECT toTypeName(variant) as type_name, 'Hello, World!'::Variant(UInt64, String, Array(UInt64)) as variant;
+```
+
+```text
+┌─type_name──────────────────────────────┬─variant───────┐
+│ Variant(Array(UInt64), String, UInt64) │ Hello, World! │
+└────────────────────────────────────────┴───────────────┘
+```
+
+### Converting a Variant column to an ordinary column
+
+It is possible to convert a `Variant` column to an ordinary column. In this case all nested variants will be converted to the destination type:
+
+```sql
+CREATE TABLE test (v Variant(UInt64, String)) ENGINE = Memory;
+INSERT INTO test VALUES (NULL), (42), ('42.42');
+SELECT v::Nullable(Float64) FROM test;
+```
+
+```text
+┌─CAST(v, 'Nullable(Float64)')─┐
+│                         ᴺᵁᴸᴸ │
+│                           42 │
+│                        42.42 │
+└──────────────────────────────┘
+```
+
+### Converting a Variant to another Variant
+
+It is possible to convert a `Variant` column to another `Variant` column, but only if the destination `Variant` column contains all nested types from the original `Variant`:
+
+```sql
+CREATE TABLE test (v Variant(UInt64, String)) ENGINE = Memory;
+INSERT INTO test VALUES (NULL), (42), ('String');
+SELECT v::Variant(UInt64, String, Array(UInt64)) FROM test;
+```
+
+```text
+┌─CAST(v, 'Variant(UInt64, String, Array(UInt64))')─┐
+│ ᴺᵁᴸᴸ                                              │
+│ 42                                                │
+│ String                                            │
+└───────────────────────────────────────────────────┘
+```
+
+
+## Reading Variant type from the data
+
+All text formats (TSV, CSV, CustomSeparated, Values, JSONEachRow, etc.) support reading the `Variant` type. During data parsing, ClickHouse tries to insert the value into the most appropriate variant type.
+
+Example:
+
+```sql
+SELECT
+    v,
+    variantElement(v, 'String') AS str,
+    variantElement(v, 'UInt64') AS num,
+    variantElement(v, 'Float64') AS float,
+    variantElement(v, 'DateTime') AS date,
+    variantElement(v, 'Array(UInt64)') AS arr
+FROM format(JSONEachRow, 'v Variant(String, UInt64, Float64, DateTime, Array(UInt64))', $$
+{"v" : "Hello, World!"},
+{"v" : 42},
+{"v" : 42.42},
+{"v" : "2020-01-01 00:00:00"},
+{"v" : [1, 2, 3]}
+$$)
+```
+
+```text
+┌─v───────────────────┬─str───────────┬──num─┬─float─┬────────────────date─┬─arr─────┐
+│ Hello, World!       │ Hello, World! │ ᴺᵁᴸᴸ │  ᴺᵁᴸᴸ │                ᴺᵁᴸᴸ │ []      │
+│ 42                  │ ᴺᵁᴸᴸ          │   42 │  ᴺᵁᴸᴸ │                ᴺᵁᴸᴸ │ []      │
+│ 42.42               │ ᴺᵁᴸᴸ          │ ᴺᵁᴸᴸ │ 42.42 │                ᴺᵁᴸᴸ │ []      │
+│ 2020-01-01 00:00:00 │ ᴺᵁᴸᴸ          │ ᴺᵁᴸᴸ │  ᴺᵁᴸᴸ │ 2020-01-01 00:00:00 │ []      │
+│ [1,2,3]             │ ᴺᵁᴸᴸ          │ ᴺᵁᴸᴸ │  ᴺᵁᴸᴸ │                ᴺᵁᴸᴸ │ [1,2,3] │
+└─────────────────────┴───────────────┴──────┴───────┴─────────────────────┴─────────┘
+```
diff --git a/docs/en/sql-reference/functions/other-functions.md b/docs/en/sql-reference/functions/other-functions.md index 5b9d01985dd..47b5ac7b724 100644 --- a/docs/en/sql-reference/functions/other-functions.md +++ b/docs/en/sql-reference/functions/other-functions.md @@ -2831,3 +2831,39 @@ Result: │ SELECT a, b FROM tab WHERE (a > 3) AND (b < 3) │ └─────────────────────────────────────────────────────────────────────────┘ ```
+
+## variantElement
+
+Extracts a column with the specified type from a `Variant` column.
+
+**Syntax**
+
+``` sql
+variantElement(variant, type_name[, default_value])
+```
+
+- `variant` — Variant column. [Variant](../../sql-reference/data-types/variant.md).
+- `type_name` — The name of the variant type to extract. [String](../../sql-reference/data-types/string.md).
+- `default_value` - The default value that will be used if variant doesn't have variant with specified type. Can be any type. Optional. + +**Returned value** + +- Subcolumn of a `Variant` column with specified type. + +**Example** + +```sql +CREATE TABLE test (v Variant(UInt64, String, Array(UInt64))) ENGINE = Memory; +INSERT INTO test VALUES (NULL), (42), ('Hello, World!'), ([1, 2, 3]); +SELECT v, variantElement(v, 'String'), variantElement(v, 'UInt64'), variantElement(v, 'Array(UInt64)') FROM test; +``` + +```text +┌─v─────────────┬─variantElement(v, 'String')─┬─variantElement(v, 'UInt64')─┬─variantElement(v, 'Array(UInt64)')─┐ +│ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ [] │ +│ 42 │ ᴺᵁᴸᴸ │ 42 │ [] │ +│ Hello, World! │ Hello, World! │ ᴺᵁᴸᴸ │ [] │ +│ [1,2,3] │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ [1,2,3] │ +└───────────────┴─────────────────────────────┴─────────────────────────────┴────────────────────────────────────┘ +``` + diff --git a/src/Columns/ColumnNullable.cpp b/src/Columns/ColumnNullable.cpp index 4ee6bb3d586..d2a579d6800 100644 --- a/src/Columns/ColumnNullable.cpp +++ b/src/Columns/ColumnNullable.cpp @@ -890,10 +890,7 @@ ColumnPtr makeNullable(const ColumnPtr & column) ColumnPtr makeNullableOrLowCardinalityNullable(const ColumnPtr & column) { - if (isColumnNullable(*column)) - return column; - - if (isColumnLowCardinalityNullable(*column)) + if (isColumnNullableOrLowCardinalityNullable(*column)) return column; if (isColumnConst(*column)) @@ -919,4 +916,21 @@ ColumnPtr makeNullableSafe(const ColumnPtr & column) return column; } +ColumnPtr makeNullableOrLowCardinalityNullableSafe(const ColumnPtr & column) +{ + if (isColumnNullableOrLowCardinalityNullable(*column)) + return column; + + if (isColumnConst(*column)) + return ColumnConst::create(makeNullableOrLowCardinalityNullableSafe(assert_cast(*column).getDataColumnPtr()), column->size()); + + if (column->lowCardinality()) + return assert_cast(*column).cloneNullable(); + + if (column->canBeInsideNullable()) + return makeNullableSafe(column); + + return column; +} + } diff --git a/src/Columns/ColumnNullable.h b/src/Columns/ColumnNullable.h index b57fdf3064d..60c7750f8fc 100644 --- a/src/Columns/ColumnNullable.h +++ b/src/Columns/ColumnNullable.h @@ -231,5 +231,6 @@ private: ColumnPtr makeNullable(const ColumnPtr & column); ColumnPtr makeNullableSafe(const ColumnPtr & column); ColumnPtr makeNullableOrLowCardinalityNullable(const ColumnPtr & column); +ColumnPtr makeNullableOrLowCardinalityNullableSafe(const ColumnPtr & column); } diff --git a/src/Columns/ColumnVariant.cpp b/src/Columns/ColumnVariant.cpp new file mode 100644 index 00000000000..67754e77992 --- /dev/null +++ b/src/Columns/ColumnVariant.cpp @@ -0,0 +1,1360 @@ +#include + +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + + +namespace DB +{ + +namespace ErrorCodes +{ + extern const int BAD_ARGUMENTS; + extern const int ILLEGAL_COLUMN; + extern const int NOT_IMPLEMENTED; + extern const int LOGICAL_ERROR; + extern const int PARAMETER_OUT_OF_BOUND; + extern const int SIZES_OF_NESTED_COLUMNS_ARE_INCONSISTENT; + extern const int SIZES_OF_COLUMNS_DOESNT_MATCH; +} + +std::string ColumnVariant::getName() const +{ + WriteBufferFromOwnString res; + res << "Variant("; + bool is_first = true; + for (const auto & local_variant : global_to_local_discriminators) + { + if (!is_first) + res << ", "; + is_first = false; + res << variants[local_variant]->getName(); + } + res << ")"; + return res.str(); +} + + +void 
ColumnVariant::initIdentityGlobalToLocalDiscriminatorsMapping() +{ + local_to_global_discriminators.reserve(variants.size()); + global_to_local_discriminators.reserve(variants.size()); + for (size_t i = 0; i != variants.size(); ++i) + { + local_to_global_discriminators.push_back(i); + global_to_local_discriminators.push_back(i); + } +} + +ColumnVariant::ColumnVariant(MutableColumns && variants_) : ColumnVariant(std::move(variants_), {}) +{ +} + +ColumnVariant::ColumnVariant(MutableColumns && variants_, const std::vector & local_to_global_discriminators_) +{ + /// Empty local_to_global_discriminators mapping means that variants are already in the global order. + if (!local_to_global_discriminators_.empty() && local_to_global_discriminators_.size() != variants_.size()) + throw Exception( + ErrorCodes::LOGICAL_ERROR, + "The number of values in local_to_global_discriminators mapping ({}) doesn't match the number of variants ({})", + local_to_global_discriminators_.size(), + variants_.size()); + + /// As variants are empty, column with local discriminators will be also empty and we can reorder variants according to global discriminators. + variants.resize(variants_.size()); + for (size_t i = 0; i != variants_.size(); ++i) + { + if (isColumnConst(*variants_[i])) + throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ColumnVariant cannot have ColumnConst as its element"); + + if (!variants_[i]->empty()) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Not empty column passed to ColumnVariant, but no local_discriminators passed"); + + if (!local_to_global_discriminators_.empty() && local_to_global_discriminators_[i] > variants_.size()) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Invalid global discriminator {}. The number of variants: {}", UInt64(local_to_global_discriminators_[i]), variants_.size()); + + if (local_to_global_discriminators_.empty()) + variants[i] = std::move(variants_[i]); + else + variants[local_to_global_discriminators_[i]] = std::move(variants_[i]); + } + + local_discriminators = ColumnDiscriminators::create(); + offsets = ColumnOffsets::create(); + + /// Now global and local discriminators are the same. 
+ initIdentityGlobalToLocalDiscriminatorsMapping(); +} + +ColumnVariant::ColumnVariant(MutableColumnPtr local_discriminators_, MutableColumns && variants_) : ColumnVariant(std::move(local_discriminators_), nullptr, std::move(variants_), {}) +{ +} + +ColumnVariant::ColumnVariant(MutableColumnPtr local_discriminators_, MutableColumns && variants_, const std::vector & global_discriminators) : ColumnVariant(std::move(local_discriminators_), nullptr, std::move(variants_), global_discriminators) +{ +} + +ColumnVariant::ColumnVariant(DB::MutableColumnPtr local_discriminators_, DB::MutableColumnPtr offsets_, DB::MutableColumns && variants_) : ColumnVariant(std::move(local_discriminators_), std::move(offsets_), std::move(variants_), {}) +{ +} + +ColumnVariant::ColumnVariant(DB::MutableColumnPtr local_discriminators_, DB::MutableColumnPtr offsets_, DB::MutableColumns && variants_, const std::vector & local_to_global_discriminators_) +{ + if (variants_.size() > MAX_NESTED_COLUMNS) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Variant type with more than {} nested types is not allowed", ColumnVariant::MAX_NESTED_COLUMNS); + + local_discriminators = std::move(local_discriminators_); + const ColumnDiscriminators * discriminators_concrete = typeid_cast(local_discriminators.get()); + if (!discriminators_concrete) + throw Exception(ErrorCodes::LOGICAL_ERROR, "discriminator column must be a ColumnUInt8"); + + variants.reserve(variants_.size()); + size_t total_size = 0; + for (auto & variant : variants_) + { + if (isColumnConst(*variant)) + throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ColumnVariant cannot have ColumnConst as its element"); + + total_size += variant->size(); + variants.push_back(std::move(variant)); + } + + /// We can have more discriminators than values in columns + /// (because of NULL discriminators), but not less. + if (total_size > local_discriminators->size()) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Nested columns sizes are inconsistent with local_discriminators column size. Total column sizes: {}, local_discriminators size: {}", total_size, local_discriminators->size()); + + if (offsets_) + { + if (!typeid_cast(offsets_.get())) + throw Exception(ErrorCodes::LOGICAL_ERROR, "offsets column must be a ColumnUInt64"); + + offsets = std::move(offsets_); + } + else + { + /// If no offsets column was provided, construct offsets based on discriminators. + offsets = ColumnOffsets::create(); + Offsets & offsets_data = typeid_cast(offsets.get())->getData(); + offsets_data.reserve(discriminators_concrete->size()); + /// If we have only NULLs, offsets column will not contain any real offsets. + if (hasOnlyNulls()) + { + offsets_data.resize(discriminators_concrete->size()); + } + /// If we have only one non empty variant and no NULLs, + /// offsets column will contain just sequential offsets 0, 1, 2, ... + else if (getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + for (size_t i = 0; i != discriminators_concrete->size(); ++i) + offsets_data.push_back(i); + } + /// Otherwise we should iterate through discriminators and + /// remember current offset for each variant column. + else + { + std::vector nested_offsets; + nested_offsets.resize(variants.size()); + for (Discriminator discr : discriminators_concrete->getData()) + { + if (discr == NULL_DISCRIMINATOR) + offsets_data.emplace_back(); + else + offsets_data.push_back(nested_offsets[discr]++); + } + } + } + + /// Empty global_discriminators means that variants are already in global order. 
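+ /// The two mappings below are inverse permutations of each other:
+ /// local_to_global_discriminators[local] is the global discriminator of variants[local],
+ /// and global_to_local_discriminators[global] is the index of that variant inside `variants`.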
+ if (local_to_global_discriminators_.empty()) + { + initIdentityGlobalToLocalDiscriminatorsMapping(); + } + else + { + if (local_to_global_discriminators_.size() != variants.size()) + throw Exception( + ErrorCodes::LOGICAL_ERROR, + "The number of values in local_to_global_discriminators mapping ({}) doesn't match the number of variants ({})", + local_to_global_discriminators_.size(), + variants.size()); + + local_to_global_discriminators = local_to_global_discriminators_; + global_to_local_discriminators.resize(local_to_global_discriminators.size()); + /// Create mapping global discriminator -> local discriminator + for (size_t i = 0; i != local_to_global_discriminators.size(); ++i) + { + if (local_to_global_discriminators[i] > variants.size()) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Invalid global discriminator {}. The number of variants: {}", UInt64(local_to_global_discriminators[i]), variants_.size()); + + global_to_local_discriminators[local_to_global_discriminators[i]] = i; + } + } +} + +ColumnVariant::Ptr ColumnVariant::create(const Columns & variants, const std::vector & local_to_global_discriminators) +{ + MutableColumns mutable_variants; + mutable_variants.reserve(variants.size()); + for (const auto & variant : variants) + { + if (isColumnConst(*variant)) + throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ColumnVariant cannot have ColumnConst as its element"); + mutable_variants.emplace_back(variant->assumeMutable()); + } + + return ColumnVariant::create(std::move(mutable_variants), local_to_global_discriminators); +} + +ColumnVariant::Ptr ColumnVariant::create(const DB::ColumnPtr & local_discriminators, const DB::Columns & variants, const std::vector & local_to_global_discriminators) +{ + MutableColumns mutable_variants; + mutable_variants.reserve(variants.size()); + for (const auto & variant : variants) + { + if (isColumnConst(*variant)) + throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ColumnVariant cannot have ColumnConst as its element"); + mutable_variants.emplace_back(variant->assumeMutable()); + } + + return ColumnVariant::create(local_discriminators->assumeMutable(), std::move(mutable_variants), local_to_global_discriminators); +} + +ColumnVariant::Ptr ColumnVariant::create(const DB::ColumnPtr & local_discriminators, const DB::ColumnPtr & offsets, const DB::Columns & variants, const std::vector & local_to_global_discriminators) +{ + MutableColumns mutable_variants; + mutable_variants.reserve(variants.size()); + for (const auto & variant : variants) + { + if (isColumnConst(*variant)) + throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ColumnVariant cannot have ColumnConst as its element"); + mutable_variants.emplace_back(variant->assumeMutable()); + } + + return ColumnVariant::create(local_discriminators->assumeMutable(), offsets->assumeMutable(), std::move(mutable_variants), local_to_global_discriminators); +} + +MutableColumnPtr ColumnVariant::cloneEmpty() const +{ + MutableColumns new_variants; + new_variants.reserve(variants.size()); + for (const auto & variant : variants) + new_variants.emplace_back(variant->cloneEmpty()); + + return ColumnVariant::create(std::move(new_variants), local_to_global_discriminators); +} + +MutableColumnPtr ColumnVariant::cloneResized(size_t new_size) const +{ + if (new_size == 0) + return cloneEmpty(); + + const size_t num_variants = variants.size(); + size_t size = local_discriminators->size(); + /// If new size is bigger than the old one, just clone column and append default values. 
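+ /// For ColumnVariant a "default" row is a NULL row: insertManyDefaults only appends
+ /// NULL_DISCRIMINATOR to local_discriminators and placeholder offsets, the nested variants stay untouched.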
+ if (new_size >= size) + { + MutableColumns new_variants; + new_variants.reserve(num_variants); + for (const auto & variant : variants) + new_variants.emplace_back(IColumn::mutate(variant)); + + auto res = ColumnVariant::create(IColumn::mutate(local_discriminators), IColumn::mutate(offsets), std::move(new_variants), local_to_global_discriminators); + res->insertManyDefaults(new_size - size); + return res; + } + + /// If new size is less than current size, we should find the new size for all variants. + + /// Optimization for case when we have only NULLs. In this case we should just resize discriminators and offsets. + if (hasOnlyNulls()) + { + MutableColumns new_variants; + new_variants.reserve(num_variants); + for (const auto & variant : variants) + new_variants.emplace_back(IColumn::mutate(variant)); + + return ColumnVariant::create(local_discriminators->cloneResized(new_size), offsets->cloneResized(new_size), std::move(new_variants), local_to_global_discriminators); + } + + /// Optimization for case when there is only 1 non-empty variant and no NULLs. + /// In this case we can simply call cloneResized on this single variant, discriminators and offsets. + if (auto non_empty_local_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + MutableColumns new_variants; + new_variants.reserve(num_variants); + for (size_t i = 0; i != variants.size(); ++i) + { + if (i == *non_empty_local_discr) + new_variants.emplace_back(variants[i]->cloneResized(new_size)); + else + new_variants.emplace_back(variants[i]->cloneEmpty()); + } + + return ColumnVariant::create(local_discriminators->cloneResized(new_size), offsets->cloneResized(new_size), std::move(new_variants), local_to_global_discriminators); + } + + const auto & local_discriminators_data = getLocalDiscriminators(); + const auto & offsets_data = getOffsets(); + + /// We can find all variants sizes by scanning all new_size local_discriminators and calculating + /// sizes for all new variants. This code is below and commented. + +// std::vector new_nested_sizes(num_variants, 0); +// for (size_t i = 0; i != new_size; ++i) +// { +// Discriminator discr = local_discriminators_data[i]; +// if (discr != NULL_DISCRIMINATOR) +// ++new_nested_sizes[discr]; +// } +// +// MutableColumns new_variants; +// new_variants.reserve(num_variants); +// for (size_t i = 0; i != num_variants; ++i) +// { +// if (new_nested_sizes[i]) +// new_variants.emplace_back(variants[i]->cloneResized(new_nested_sizes[i])); +// else +// new_variants.emplace_back(variants[i]->cloneEmpty()); +// } +// +// return ColumnVariant::create(local_discriminators->cloneResized(new_size), offsets->cloneResized(new_size), std::move(new_variants), local_to_global_discriminators); + + /// But instead we are trying to optimize it using offsets column: + /// For all non-empty variants we are trying to find last occurrence of its discriminator in local_discriminators[:new_size] or + /// first occurrence in local_discriminators[new_size:]. The same row in offsets column will contain the desired size (or size - 1) of variant. + /// All empty variants will remain empty. + /// Not sure how good this optimization is, feel free to remove it and use simpler version above. + + MutableColumns new_variants(num_variants); + std::unordered_set seen_variants; + /// First, check which variants are empty. They will remain empty. 
+ for (Discriminator i = 0; i != num_variants; ++i) + { + if (variants[i]->empty()) + { + seen_variants.insert(i); + new_variants[i] = variants[i]->cloneEmpty(); + } + } + + /// Now, iterate through local discriminators using two pointers. + /// First will go from new_size - 1 to 0, second from new_size to size. + /// Finish when we find all variants or hit lower or upper bound. + ssize_t i = new_size - 1; + size_t j = new_size; + while (i != -1 && j != size) + { + Discriminator i_discr = local_discriminators_data[i]; + if (i_discr != NULL_DISCRIMINATOR) + { + auto [_, inserted] = seen_variants.insert(i_discr); + /// If this is the first occurrence of this discriminator, + /// we can get new size for this variant. + if (inserted) + { + new_variants[i_discr] = variants[i_discr]->cloneResized(offsets_data[i] + 1); + if (seen_variants.size() == num_variants) + break; + } + } + + Discriminator j_discr = local_discriminators_data[j]; + if (j_discr != NULL_DISCRIMINATOR) + { + auto [_, inserted] = seen_variants.insert(j_discr); + /// If this is the first occurrence of this discriminator, + /// we can get new size for this variant. + if (inserted) + { + new_variants[j_discr] = variants[j_discr]->cloneResized(offsets_data[j]); + if (seen_variants.size() == num_variants) + break; + } + } + + --i; + ++j; + } + + /// We can finish in 3 cases: + /// 1) seen_variants.size() == num_variants - we found local_discriminators of all variants, nothing to do. + /// 2) i == -1 - we scanned all values in local_discriminators[:new_size]. Not found variants doesn't have + /// values in local_discriminators[:new_size], so they should be empty in the resized version. + /// 3) j == size - we scanned all values in local_discriminators[new_size:]. Not found variants doesn't have + /// values in local_discriminators[new_size:], so, we should use the full variant in the resized version. 
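+ /// Worked example (illustration only): with local_discriminators = [0, 1, 0, NULL, 1],
+ /// offsets = [0, 0, 1, 0, 1] and new_size = 3, the backward scan finds discriminator 0 at row 2
+ /// (offset 1, so variant 0 is resized to 2 rows) and discriminator 1 at row 1 (offset 0, so it is
+ /// resized to 1 row); all variants are seen and the loop above exits before hitting either bound.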
+ if (seen_variants.size() != num_variants) + { + for (size_t discr = 0; discr != num_variants; ++discr) + { + if (!seen_variants.contains(discr)) + { + if (i == -1) + new_variants[discr] = variants[discr]->cloneEmpty(); + else + new_variants[discr] = IColumn::mutate(variants[discr]); + } + } + } + + return ColumnVariant::create(local_discriminators->cloneResized(new_size), offsets->cloneResized(new_size), std::move(new_variants), local_to_global_discriminators); +} + +Field ColumnVariant::operator[](size_t n) const +{ + Discriminator discr = localDiscriminatorAt(n); + if (discr == NULL_DISCRIMINATOR) + return Null(); + return (*variants[discr])[offsetAt(n)]; +} + +void ColumnVariant::get(size_t n, Field & res) const +{ + Discriminator discr = localDiscriminatorAt(n); + if (discr == NULL_DISCRIMINATOR) + res = Null(); + else + variants[discr]->get(offsetAt(n), res); +} + +bool ColumnVariant::isDefaultAt(size_t n) const +{ + return localDiscriminatorAt(n) == NULL_DISCRIMINATOR; +} + +bool ColumnVariant::isNullAt(size_t n) const +{ + return localDiscriminatorAt(n) == NULL_DISCRIMINATOR; +} + +StringRef ColumnVariant::getDataAt(size_t) const +{ + throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method getDataAt is not supported for {}", getName()); +} + +void ColumnVariant::insertData(const char *, size_t) +{ + throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method insertData is not supported for {}", getName()); +} + +void ColumnVariant::insert(const Field & field) +{ + if (field.isNull()) + insertDefault(); + else + throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Cannot insert field {} to column {}", toString(field), getName()); +} + +void ColumnVariant::insertFrom(const IColumn & src_, size_t n) +{ + const ColumnVariant & src = assert_cast(src_); + + const size_t num_variants = variants.size(); + if (src.variants.size() != num_variants) + throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Cannot insert value of Variant type with different number of types"); + + /// Remember that src column can have different local variants order. + Discriminator global_discr = src.globalDiscriminatorAt(n); + Discriminator local_discr = localDiscriminatorByGlobal(global_discr); + getLocalDiscriminators().push_back(local_discr); + if (local_discr == NULL_DISCRIMINATOR) + { + getOffsets().emplace_back(); + } + else + { + getOffsets().push_back(variants[local_discr]->size()); + variants[local_discr]->insertFrom(src.getVariantByGlobalDiscriminator(global_discr), src.offsetAt(n)); + } +} + +void ColumnVariant::insertRangeFrom(const IColumn & src_, size_t start, size_t length) +{ + const size_t num_variants = variants.size(); + const auto & src = assert_cast(src_); + if (src.variants.size() != num_variants) + throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Cannot insert value of Variant type with different number of types"); + + if (start + length > src.getLocalDiscriminators().size()) + throw Exception(ErrorCodes::PARAMETER_OUT_OF_BOUND, "Parameter out of bound in ColumnVariant::insertRangeFrom method. " + "[start({}) + length({}) > local_discriminators.size({})]", start, length, src.getLocalDiscriminators().size()); + + /// If src column contains only NULLs, just insert NULLs. + if (src.hasOnlyNulls()) + { + insertManyDefaults(length); + return; + } + + /// Optimization for case when there is only 1 non-empty variant and no NULLs in src column. + /// In this case we can simply call insertRangeFrom on this single variant. 
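+ /// The check below relies on the fact that in this case the single non-empty variant contains exactly
+ /// as many rows as the whole local_discriminators column (see getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls).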
+ if (auto non_empty_src_local_discr = src.getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + auto local_discr = localDiscriminatorByGlobal(src.globalDiscriminatorByLocal(*non_empty_src_local_discr)); + size_t offset = variants[local_discr]->size(); + variants[local_discr]->insertRangeFrom(*src.variants[*non_empty_src_local_discr], start, length); + getLocalDiscriminators().resize_fill(local_discriminators->size() + length, local_discr); + auto & offsets_data = getOffsets(); + offsets_data.reserve(offsets_data.size() + length); + for (size_t i = 0; i != length; ++i) + offsets_data.push_back(offset++); + return; + } + + /// Iterate through src local_discriminators in range [start, start + length], + /// collect ranges we need to insert for all variants and update offsets. + /// nested_ranges[i].first - offset in src.variants[i] + /// nested_ranges[i].second - length in src.variants[i] + std::vector> nested_ranges(num_variants, {0, 0}); + auto & offsets_data = getOffsets(); + offsets_data.reserve(offsets_data.size() + length); + auto & local_discriminators_data = getLocalDiscriminators(); + local_discriminators_data.reserve(local_discriminators_data.size() + length); + const auto & src_offsets_data = src.getOffsets(); + const auto & src_local_discriminators_data = src.getLocalDiscriminators(); + for (size_t i = start; i != start + length; ++i) + { + /// We insert from src.variants[src_local_discr] to variants[local_discr] + Discriminator src_local_discr = src_local_discriminators_data[i]; + Discriminator local_discr = localDiscriminatorByGlobal(src.globalDiscriminatorByLocal(src_local_discr)); + local_discriminators_data.push_back(local_discr); + if (local_discr == NULL_DISCRIMINATOR) + { + offsets_data.emplace_back(); + } + else + { + /// If we see this discriminator for the first time, set its range start. + if (!nested_ranges[src_local_discr].second) + nested_ranges[src_local_discr].first = src_offsets_data[i]; + /// Update offsets column with correct offset. + offsets_data.push_back(variants[local_discr]->size() + nested_ranges[src_local_discr].second); + ++nested_ranges[src_local_discr].second; + } + } + + for (size_t src_local_discr = 0; src_local_discr != nested_ranges.size(); ++src_local_discr) + { + auto [nested_start, nested_length] = nested_ranges[src_local_discr]; + auto local_discr = localDiscriminatorByGlobal(src.globalDiscriminatorByLocal(src_local_discr)); + if (nested_length) + variants[local_discr]->insertRangeFrom(*src.variants[src_local_discr], nested_start, nested_length); + } +} + +void ColumnVariant::insertManyFrom(const DB::IColumn & src_, size_t position, size_t length) +{ + const size_t num_variants = variants.size(); + const auto & src = assert_cast(src_); + if (src.variants.size() != num_variants) + throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Cannot insert value of Variant type with different number of types"); + + /// Remember that src column can have different local variants order. 
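+ /// Translate the discriminator in two steps, src local -> global -> our local,
+ /// because only global discriminators are guaranteed to mean the same variant in both columns.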
+ Discriminator src_local_discr = src.localDiscriminatorAt(position); + Discriminator local_discr = localDiscriminatorByGlobal(src.globalDiscriminatorByLocal(src_local_discr)); + auto & local_discriminators_data = getLocalDiscriminators(); + local_discriminators_data.resize_fill(local_discriminators_data.size() + length, local_discr); + + auto & offsets_data = getOffsets(); + if (local_discr == NULL_DISCRIMINATOR) + { + offsets_data.resize_fill(offsets_data.size() + length); + } + else + { + size_t prev_offset = variants[local_discr]->size(); + offsets_data.reserve(offsets_data.size() + length); + for (size_t i = 0; i != length; ++i) + offsets_data.push_back(prev_offset + i); + + variants[local_discr]->insertManyFrom(*src.variants[src_local_discr], src.offsetAt(position), length); + } +} + +void ColumnVariant::insertDefault() +{ + getLocalDiscriminators().push_back(NULL_DISCRIMINATOR); + getOffsets().emplace_back(); +} + +void ColumnVariant::insertManyDefaults(size_t length) +{ + size_t size = local_discriminators->size(); + getLocalDiscriminators().resize_fill(size + length, NULL_DISCRIMINATOR); + getOffsets().resize_fill(size + length); +} + +void ColumnVariant::popBack(size_t n) +{ + /// If we have only NULLs, just pop back from local_discriminators and offsets. + if (hasOnlyNulls()) + { + local_discriminators->popBack(n); + offsets->popBack(n); + return; + } + + /// Optimization for case when there is only 1 non-empty variant and no NULLs. + /// In this case we can just popBack n elements from this variant. + if (auto non_empty_local_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + variants[*non_empty_local_discr]->popBack(n); + local_discriminators->popBack(n); + offsets->popBack(n); + return; + } + + /// Calculate how many rows we need to pop from each variant + auto & local_discriminators_data = getLocalDiscriminators(); + size_t size = local_discriminators_data.size(); + const size_t num_variants = variants.size(); + std::vector nested_n(num_variants, 0); + for (size_t i = 0; i != n; ++i) + { + Discriminator discr = local_discriminators_data[size - i - 1]; + if (discr != NULL_DISCRIMINATOR) + ++nested_n[discr]; + } + + for (size_t i = 0; i != num_variants; ++i) + { + if (nested_n[i]) + variants[i]->popBack(nested_n[i]); + } + + local_discriminators->popBack(n); + offsets->popBack(n); +} + +StringRef ColumnVariant::serializeValueIntoArena(size_t n, Arena & arena, char const *& begin, const UInt8 *) const +{ + /// During any serialization/deserialization we should always use global discriminators. + Discriminator global_discr = globalDiscriminatorAt(n); + char * pos = arena.allocContinue(sizeof(global_discr), begin); + memcpy(pos, &global_discr, sizeof(global_discr)); + StringRef res(pos, sizeof(global_discr)); + + if (global_discr == NULL_DISCRIMINATOR) + return res; + + auto value_ref = variants[localDiscriminatorByGlobal(global_discr)]->serializeValueIntoArena(offsetAt(n), arena, begin); + res.data = value_ref.data - res.size; + res.size += value_ref.size; + + return res; +} + +const char * ColumnVariant::deserializeAndInsertFromArena(const char * pos) +{ + /// During any serialization/deserialization we should always use global discriminators. 
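+ /// The layout written by serializeValueIntoArena above is [global discriminator][value serialized
+ /// by the selected variant], or just [global discriminator] for NULL rows (NULL_DISCRIMINATOR).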
+ Discriminator global_discr = unalignedLoad(pos); + pos += sizeof(global_discr); + Discriminator local_discr = localDiscriminatorByGlobal(global_discr); + getLocalDiscriminators().push_back(local_discr); + if (local_discr == NULL_DISCRIMINATOR) + { + getOffsets().emplace_back(); + return pos; + } + + getOffsets().push_back(variants[local_discr]->size()); + return variants[local_discr]->deserializeAndInsertFromArena(pos); +} + +const char * ColumnVariant::skipSerializedInArena(const char * pos) const +{ + Discriminator global_discr = unalignedLoad(pos); + pos += sizeof(global_discr); + if (global_discr == NULL_DISCRIMINATOR) + return pos; + + return variants[localDiscriminatorByGlobal(global_discr)]->skipSerializedInArena(pos); +} + +void ColumnVariant::updateHashWithValue(size_t n, SipHash & hash) const +{ + Discriminator global_discr = globalDiscriminatorAt(n); + hash.update(global_discr); + if (global_discr != NULL_DISCRIMINATOR) + variants[localDiscriminatorByGlobal(global_discr)]->updateHashWithValue(offsetAt(n), hash); +} + +void ColumnVariant::updateWeakHash32(WeakHash32 & hash) const +{ + auto s = size(); + + if (hash.getData().size() != s) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Size of WeakHash32 does not match size of column: " + "column size is {}, hash size is {}", std::to_string(s), std::to_string(hash.getData().size())); + + /// If we have only NULLs, keep hash unchanged. + if (hasOnlyNulls()) + return; + + /// Optimization for case when there is only 1 non-empty variant and no NULLs. + /// In this case we can just calculate weak hash for this variant. + if (auto non_empty_local_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + variants[*non_empty_local_discr]->updateWeakHash32(hash); + return; + } + + /// Calculate weak hash for all variants. + std::vector nested_hashes; + for (const auto & variant : variants) + { + WeakHash32 nested_hash(variant->size()); + variant->updateWeakHash32(nested_hash); + nested_hashes.emplace_back(std::move(nested_hash)); + } + + /// For each row hash is a hash of corresponding row from corresponding variant. + auto & hash_data = hash.getData(); + const auto & local_discriminators_data = getLocalDiscriminators(); + const auto & offsets_data = getOffsets(); + for (size_t i = 0; i != local_discriminators_data.size(); ++i) + { + Discriminator discr = local_discriminators_data[i]; + /// Update hash only for non-NULL values + if (discr != NULL_DISCRIMINATOR) + { + auto nested_hash = nested_hashes[local_discriminators_data[i]].getData()[offsets_data[i]]; + hash_data[i] = static_cast(hashCRC32(nested_hash, hash_data[i])); + } + } +} + +void ColumnVariant::updateHashFast(SipHash & hash) const +{ + local_discriminators->updateHashFast(hash); + for (const auto & variant : variants) + variant->updateHashFast(hash); +} + +ColumnPtr ColumnVariant::filter(const Filter & filt, ssize_t result_size_hint) const +{ + if (size() != filt.size()) + throw Exception(ErrorCodes::SIZES_OF_COLUMNS_DOESNT_MATCH, "Size of filter ({}) doesn't match size of column ({})", filt.size(), size()); + + /// If we have only NULLs, just filter local_discriminators column. + if (hasOnlyNulls()) + { + Columns new_variants(variants.begin(), variants.end()); + auto new_discriminators = local_discriminators->filter(filt, result_size_hint); + /// In case of all NULL values offsets doesn't contain any useful values, just resize it. 
+ ColumnPtr new_offsets = offsets->cloneResized(new_discriminators->size()); + return ColumnVariant::create(new_discriminators, new_offsets, new_variants, local_to_global_discriminators); + } + + /// Optimization for case when there is only 1 non-empty variant and no NULLs. + /// In this case we can just filter this variant and resize discriminators/offsets. + if (auto non_empty_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + Columns new_variants(variants.begin(), variants.end()); + new_variants[*non_empty_discr] = variants[*non_empty_discr]->filter(filt, result_size_hint); + size_t new_size = new_variants[*non_empty_discr]->size(); + ColumnPtr new_discriminators = local_discriminators->cloneResized(new_size); + ColumnPtr new_offsets = offsets->cloneResized(new_size); + return ColumnVariant::create(new_discriminators, new_offsets, new_variants, local_to_global_discriminators); + } + + /// We should create filter for each variant + /// according to local_discriminators and given filter. + const size_t num_variants = variants.size(); + std::vector nested_filters(num_variants); + for (size_t i = 0; i != num_variants; ++i) + nested_filters[i].reserve(variants[i]->size()); + + /// As we will iterate through local_discriminators anyway, we can count + /// result size for each variant. + std::vector variant_result_size_hints(num_variants); + + const auto & local_discriminators_data = getLocalDiscriminators(); + for (size_t i = 0; i != local_discriminators_data.size(); ++i) + { + Discriminator discr = local_discriminators_data[i]; + if (discr != NULL_DISCRIMINATOR) + { + nested_filters[local_discriminators_data[i]].push_back(filt[i]); + variant_result_size_hints[local_discriminators_data[i]] += !!(filt[i]); + } + } + + Columns new_variants; + new_variants.reserve(num_variants); + for (size_t i = 0; i != num_variants; ++i) + { + /// It make sense to call filter() on variant only if the result size is not 0. + if (variant_result_size_hints[i]) + new_variants.emplace_back(variants[i]->filter(nested_filters[i], variant_result_size_hints[i])); + else + new_variants.emplace_back(variants[i]->cloneEmpty()); + } + + /// We cannot use filtered offsets column, as it will be incorrect. + /// It will be reconstructed on ColumnVariant creation according to new local_discriminators. + return ColumnVariant::create(local_discriminators->filter(filt, result_size_hint), new_variants, local_to_global_discriminators); +} + +void ColumnVariant::expand(const Filter & mask, bool inverted) +{ + /// Expand local_discriminators using NULL_DISCRIMINATOR for 0-rows. + expandDataByMask(getLocalDiscriminators(), mask, inverted, NULL_DISCRIMINATOR); + expandDataByMask(getOffsets(), mask, inverted); +} + +ColumnPtr ColumnVariant::permute(const Permutation & perm, size_t limit) const +{ + /// If we have only NULLs, permutation will take no effect, just return resized column. + if (hasOnlyNulls()) + return cloneResized(limit); + + /// Optimization when we have only one non empty variant and no NULLs. + /// In this case local_discriminators column is filled with identical values and offsets column + /// filled with sequential numbers. In this case we can just apply permutation to this + /// single non-empty variant and cut local_discriminators and offsets columns to the result size. 
+ if (auto non_empty_local_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + MutableColumns new_variants; + const size_t num_variants = variants.size(); + new_variants.reserve(num_variants); + for (size_t i = 0; i != num_variants; ++i) + { + if (i == *non_empty_local_discr) + new_variants.emplace_back(variants[*non_empty_local_discr]->permute(perm, limit)->assumeMutable()); + else + new_variants.emplace_back(variants[i]->assumeMutable()); + } + + size_t new_size = new_variants[*non_empty_local_discr]->size(); + return ColumnVariant::create(local_discriminators->cloneResized(new_size), offsets->cloneResized(new_size), std::move(new_variants), local_to_global_discriminators); + } + + return permuteImpl(*this, perm, limit); +} + +ColumnPtr ColumnVariant::index(const IColumn & indexes, size_t limit) const +{ + /// If we have only NULLs, index will take no effect, just return resized column. + if (hasOnlyNulls()) + return cloneResized(limit); + + /// Optimization when we have only one non empty variant and no NULLs. + /// In this case local_discriminators column is filled with identical values and offsets column + /// filled with sequential numbers. So we can just apply indexes to this + /// single non-empty variant and cut local_discriminators and offsets columns to the result size. + if (auto non_empty_local_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + MutableColumns new_variants; + const size_t num_variants = variants.size(); + new_variants.reserve(num_variants); + for (size_t i = 0; i != num_variants; ++i) + { + if (i == *non_empty_local_discr) + new_variants.emplace_back(variants[*non_empty_local_discr]->index(indexes, limit)->assumeMutable()); + else + new_variants.emplace_back(variants[i]->assumeMutable()); + } + + size_t new_size = new_variants[*non_empty_local_discr]->size(); + return ColumnVariant::create(local_discriminators->cloneResized(new_size), offsets->cloneResized(new_size), std::move(new_variants), local_to_global_discriminators); + } + + return selectIndexImpl(*this, indexes, limit); +} + +template +ColumnPtr ColumnVariant::indexImpl(const PaddedPODArray & indexes, size_t limit) const +{ + /// First, apply indexes for local_discriminators and offsets. + ColumnPtr new_local_discriminators = assert_cast(*local_discriminators).indexImpl(indexes, limit); + ColumnPtr new_offsets = assert_cast(*offsets).indexImpl(indexes, limit); + const auto & new_local_discriminators_data = assert_cast(*new_local_discriminators).getData(); + const auto & new_offsets_data = assert_cast(*new_offsets).getData(); + /// Then, create permutation for each variant. + const size_t num_variants = variants.size(); + std::vector nested_perms(num_variants); + /// If there is no limit, we know the size of each permutation + /// in advance and can use reserve. + if (limit == 0) + { + for (size_t i = 0; i != num_variants; ++i) + nested_perms[i].reserve(variants[i]->size()); + } + + for (size_t i = 0; i != new_local_discriminators_data.size(); ++i) + { + Discriminator discr = new_local_discriminators_data[i]; + if (discr != NULL_DISCRIMINATOR) + nested_perms[discr].push_back(new_offsets_data[i]); + } + + Columns new_variants; + new_variants.reserve(num_variants); + for (size_t i = 0; i != num_variants; ++i) + { + size_t nested_limit = nested_perms[i].size() == variants[i]->size() ? 
0 : nested_perms[i].size(); + new_variants.emplace_back(variants[i]->permute(nested_perms[i], nested_limit)); + } + + /// We cannot use new_offsets column as an offset column, because it became invalid after variants permutation. + /// New offsets column will be created in constructor. + return ColumnVariant::create(new_local_discriminators, new_variants, local_to_global_discriminators); +} + +ColumnPtr ColumnVariant::replicate(const Offsets & replicate_offsets) const +{ + if (size() != replicate_offsets.size()) + throw Exception(ErrorCodes::SIZES_OF_COLUMNS_DOESNT_MATCH, "Size of offsets {} doesn't match size of column {}", replicate_offsets.size(), size()); + + if (empty()) + return cloneEmpty(); + + /// If we have only NULLs, just resize column to the new size. + if (hasOnlyNulls()) + return cloneResized(replicate_offsets.back()); + + const size_t num_variants = variants.size(); + + /// Optimization when we have only one non empty variant and no NULLs. + /// In this case local_discriminators column is filled with identical values and offsets column + /// filled with sequential numbers. So we can just replicate this one non empty variant, + /// then resize local_discriminators to the result size and fill offsets column. + if (auto non_empty_local_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + MutableColumns new_variants; + new_variants.reserve(num_variants); + for (size_t i = 0; i != num_variants; ++i) + { + if (i == *non_empty_local_discr) + new_variants.emplace_back(variants[*non_empty_local_discr]->replicate(replicate_offsets)->assumeMutable()); + else + new_variants.emplace_back(variants[i]->cloneEmpty()); + } + + size_t new_size = new_variants[*non_empty_local_discr]->size(); + /// Create and fill new local_discriminators column with non_empty_index discriminator. + auto new_local_discriminators = IColumn::mutate(local_discriminators); + assert_cast(*new_local_discriminators).getData().resize_fill(new_size, *non_empty_local_discr); + /// Create and fill new offsets column with sequential indexes. + auto new_offsets = IColumn::mutate(offsets); + auto & new_offsets_data = assert_cast(*new_offsets).getData(); + size_t old_size = offsets->size(); + if (new_size > old_size) + { + new_offsets_data.reserve(new_size); + for (size_t i = old_size; i < new_size; ++i) + new_offsets_data.push_back(new_offsets_data[i - 1] + 1); + } + else + { + new_offsets_data.resize(new_size); + } + + return ColumnVariant::create(std::move(new_local_discriminators), std::move(new_offsets), std::move(new_variants), local_to_global_discriminators); + } + + /// Create replicate offsets for each variant according to + /// local_discriminators column. 
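+ /// Example (illustration only): replicate_offsets = [1, 3, 3] keeps row 0 once, repeats row 1 twice
+ /// and drops row 2; each row contributes its repeat count only to the replicate offsets of its own variant.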
+ std::vector nested_replicated_offsets(num_variants); + for (size_t i = 0; i != num_variants; ++i) + nested_replicated_offsets[i].reserve(variants[i]->size()); + + const auto & local_discriminators_data = getLocalDiscriminators(); + for (size_t i = 0; i != local_discriminators_data.size(); ++i) + { + Discriminator discr = local_discriminators_data[i]; + if (discr != NULL_DISCRIMINATOR) + { + size_t repeat_count = replicate_offsets[i] - replicate_offsets[i - 1]; + nested_replicated_offsets[discr].push_back(nested_replicated_offsets[discr].back() + repeat_count); + } + } + + auto new_local_discriminators = local_discriminators->replicate(replicate_offsets); + Columns new_variants; + new_variants.reserve(num_variants); + for (size_t i = 0; i != num_variants; ++i) + new_variants.emplace_back(variants[i]->replicate(nested_replicated_offsets[i])); + + /// New offsets column will be created in constructor. + return ColumnVariant::create(new_local_discriminators, new_variants, local_to_global_discriminators); +} + +MutableColumns ColumnVariant::scatter(ColumnIndex num_columns, const Selector & selector) const +{ + const size_t num_variants = variants.size(); + + /// If we have only NULLs, we need to scatter only local_discriminators. + if (hasOnlyNulls()) + { + auto scattered_local_discriminators = local_discriminators->scatter(num_columns, selector); + MutableColumns result; + result.reserve(num_columns); + for (size_t i = 0; i != num_columns; ++i) + { + MutableColumns new_variants; + new_variants.reserve(num_variants); + for (const auto & variant : variants) + new_variants.emplace_back(IColumn::mutate(variant)); + + result.emplace_back(ColumnVariant::create(std::move(scattered_local_discriminators[i]), std::move(new_variants), local_to_global_discriminators)); + } + + return result; + } + + /// Optimization when we have only one non empty variant and no NULLs. + /// In this case we can just scatter local_discriminators and this non empty variant. + if (auto non_empty_local_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + auto scattered_local_discriminators = local_discriminators->scatter(num_columns, selector); + auto scattered_non_empty_variant = variants[*non_empty_local_discr]->scatter(num_columns, selector); + MutableColumns result; + result.reserve(num_columns); + for (size_t i = 0; i != num_columns; ++i) + { + MutableColumns scattered_nested_variants(num_variants); + for (size_t j = 0; j != num_variants; ++j) + { + if (j == *non_empty_local_discr) + scattered_nested_variants[j] = std::move(scattered_non_empty_variant[i]); + else + scattered_nested_variants[j] = IColumn::mutate(variants[j]); + } + + result.emplace_back(ColumnVariant::create(std::move(scattered_local_discriminators[i]), std::move(scattered_nested_variants), local_to_global_discriminators)); + } + + return result; + } + + /// Create selector for each variant according to local_discriminators. 
+ std::vector nested_selectors(num_variants); + for (size_t i = 0; i != num_variants; ++i) + nested_selectors[i].reserve(variants[i]->size()); + + const auto & local_discriminators_data = getLocalDiscriminators(); + for (size_t i = 0; i != local_discriminators_data.size(); ++i) + { + Discriminator discr = local_discriminators_data[i]; + if (discr != NULL_DISCRIMINATOR) + nested_selectors[discr].push_back(selector[i]); + } + + auto scattered_local_discriminators = local_discriminators->scatter(num_columns, selector); + std::vector nested_scattered_variants; + nested_scattered_variants.reserve(num_variants); + for (size_t i = 0; i != num_variants; ++i) + nested_scattered_variants.emplace_back(variants[i]->scatter(num_columns, nested_selectors[i])); + + MutableColumns result; + result.reserve(num_columns); + for (size_t i = 0; i != num_columns; ++i) + { + MutableColumns new_variants; + new_variants.reserve(num_variants); + for (size_t j = 0; j != num_variants; ++j) + new_variants.emplace_back(std::move(nested_scattered_variants[j][i])); + result.emplace_back(ColumnVariant::create(std::move(scattered_local_discriminators[i]), std::move(new_variants), local_to_global_discriminators)); + } + + return result; +} + +void ColumnVariant::gather(ColumnGathererStream & gatherer) +{ + gatherer.gather(*this); +} + +bool ColumnVariant::hasEqualValues() const +{ + if (local_discriminators->empty() || hasOnlyNulls()) + return true; + + return local_discriminators->hasEqualValues() && variants[localDiscriminatorAt(0)]->hasEqualValues(); +} + +void ColumnVariant::getPermutation(IColumn::PermutationSortDirection, IColumn::PermutationSortStability, size_t, int, IColumn::Permutation & res) const +{ + size_t s = local_discriminators->size(); + res.resize(s); + for (size_t i = 0; i < s; ++i) + res[i] = i; +} + +void ColumnVariant::updatePermutation(IColumn::PermutationSortDirection, IColumn::PermutationSortStability, size_t, int, IColumn::Permutation &, DB::EqualRanges &) const +{ +} + +void ColumnVariant::reserve(size_t n) +{ + local_discriminators->reserve(n); + offsets->reserve(n); +} + +void ColumnVariant::ensureOwnership() +{ + const size_t num_variants = variants.size(); + for (size_t i = 0; i < num_variants; ++i) + getVariantByLocalDiscriminator(i).ensureOwnership(); +} + +size_t ColumnVariant::byteSize() const +{ + size_t res = local_discriminators->byteSize() + offsets->byteSize(); + for (const auto & variant : variants) + res += variant->byteSize(); + return res; +} + +size_t ColumnVariant::byteSizeAt(size_t n) const +{ + size_t res = sizeof(Offset) + sizeof(Discriminator); + Discriminator discr = localDiscriminatorAt(n); + if (discr == NULL_DISCRIMINATOR) + return res; + + return res + variants[discr]->byteSizeAt(offsetAt(n)); +} + +size_t ColumnVariant::allocatedBytes() const +{ + size_t res = local_discriminators->allocatedBytes() + offsets->allocatedBytes(); + for (const auto & variant : variants) + res += variant->allocatedBytes(); + return res; +} + +void ColumnVariant::protect() +{ + local_discriminators->protect(); + offsets->protect(); + for (auto & variant : variants) + variant->protect(); +} + +void ColumnVariant::getExtremes(Field & min, Field & max) const +{ + min = Null(); + max = Null(); +} + +void ColumnVariant::forEachSubcolumn(MutableColumnCallback callback) +{ + callback(local_discriminators); + callback(offsets); + for (auto & variant : variants) + callback(variant); +} + +void ColumnVariant::forEachSubcolumnRecursively(RecursiveMutableColumnCallback callback) +{ + 
callback(*local_discriminators); + local_discriminators->forEachSubcolumnRecursively(callback); + callback(*offsets); + offsets->forEachSubcolumnRecursively(callback); + + for (auto & variant : variants) + { + callback(*variant); + variant->forEachSubcolumnRecursively(callback); + } +} + +bool ColumnVariant::structureEquals(const IColumn & rhs) const +{ + const auto * rhs_variant = typeid_cast(&rhs); + if (!rhs_variant) + return false; + + const size_t num_variants = variants.size(); + if (num_variants != rhs_variant->variants.size()) + return false; + + for (size_t i = 0; i < num_variants; ++i) + if (!variants[i]->structureEquals(rhs_variant->getVariantByGlobalDiscriminator(globalDiscriminatorByLocal(i)))) + return false; + + return true; +} + +ColumnPtr ColumnVariant::compress() const +{ + ColumnPtr local_discriminators_compressed = local_discriminators->compress(); + ColumnPtr offsets_compressed = offsets->compress(); + size_t byte_size = local_discriminators_compressed->byteSize() + offsets_compressed->byteSize(); + Columns compressed; + compressed.reserve(variants.size()); + for (const auto & variant : variants) + { + auto compressed_variant = variant->compress(); + byte_size += compressed_variant->byteSize(); + compressed.emplace_back(std::move(compressed_variant)); + } + + return ColumnCompressed::create(size(), byte_size, + [my_local_discriminators_compressed = std::move(local_discriminators_compressed), my_offsets_compressed = std::move(offsets_compressed), my_compressed = std::move(compressed), my_local_to_global_discriminators = this->local_to_global_discriminators]() mutable + { + for (auto & variant : my_compressed) + variant = variant->decompress(); + return ColumnVariant::create(my_local_discriminators_compressed->decompress(), my_offsets_compressed->decompress(), my_compressed, my_local_to_global_discriminators); + }); +} + +double ColumnVariant::getRatioOfDefaultRows(double) const +{ + UInt64 num_defaults = getNumberOfDefaultRows(); + return static_cast(num_defaults) / local_discriminators->size(); +} + +UInt64 ColumnVariant::getNumberOfDefaultRows() const +{ + size_t total_variant_sizes = 0; + for (const auto & variant : variants) + total_variant_sizes += variant->size(); + return local_discriminators->size() - total_variant_sizes; +} + +void ColumnVariant::getIndicesOfNonDefaultRows(Offsets & indices, size_t from, size_t limit) const +{ + return getIndicesOfNonDefaultRowsImpl(indices, from, limit); +} + +void ColumnVariant::finalize() +{ + for (auto & variant : variants) + variant->finalize(); +} + +bool ColumnVariant::isFinalized() const +{ + return std::all_of(variants.begin(), variants.end(), [](const auto & variant) { return variant->isFinalized(); }); +} + +std::optional ColumnVariant::getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls() const +{ + for (size_t i = 0; i != variants.size(); ++i) + { + if (variants[i]->size() == local_discriminators->size()) + return i; + } + + return std::nullopt; +} + +void ColumnVariant::applyNullMap(const ColumnVector::Container & null_map) +{ + applyNullMapImpl(null_map); +} + +void ColumnVariant::applyNegatedNullMap(const ColumnVector::Container & null_map) +{ + applyNullMapImpl(null_map); +} + +template +void ColumnVariant::applyNullMapImpl(const ColumnVector::Container & null_map) +{ + if (null_map.size() != local_discriminators->size()) + throw Exception(ErrorCodes::SIZES_OF_NESTED_COLUMNS_ARE_INCONSISTENT, + "Logical error: Sizes of discriminators column and null map data are not equal"); + + /// If we have only NULLs, nothing 
to do. + if (hasOnlyNulls()) + { + return; + } + + /// If we have only 1 non empty column and no NULLs, we can just filter that + /// variant according to the null_map. + if (auto non_empty_local_discr = getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + auto & local_discriminators_data = getLocalDiscriminators(); + auto & offsets_data = getOffsets(); + size_t size_hint = 0; + + if constexpr (inverted) + { + for (size_t i = 0; i != local_discriminators_data.size(); ++i) + { + if (null_map[i]) + offsets_data[i] = size_hint++; + else + local_discriminators_data[i] = NULL_DISCRIMINATOR; + } + variants[*non_empty_local_discr] = variants[*non_empty_local_discr]->filter(null_map, size_hint); + } + else + { + ColumnVector::Container filter; + filter.reserve(null_map.size()); + for (size_t i = 0; i != local_discriminators_data.size(); ++i) + { + if (null_map[i]) + { + filter.push_back(0); + local_discriminators_data[i] = NULL_DISCRIMINATOR; + } + else + { + filter.push_back(1); + offsets_data[i] = size_hint++; + } + } + variants[*non_empty_local_discr] = variants[*non_empty_local_discr]->filter(filter, size_hint); + } + + return; + } + + /// In general case we should iterate through null_map + discriminators, + /// create filter for each variant and update offsets column. + std::vector variant_filters; + variant_filters.resize(variants.size()); + std::vector variant_new_sizes; + variant_new_sizes.resize(variants.size(), 0); + + auto & local_discriminators_data = getLocalDiscriminators(); + auto & offsets_data = getOffsets(); + for (size_t i = 0; i != local_discriminators_data.size(); ++i) + { + auto & discr = local_discriminators_data[i]; + if (discr != NULL_DISCRIMINATOR) + { + if (null_map[i] ^ inverted) + { + auto & variant_filter = variant_filters[discr]; + /// We create filters lazily. + if (variant_filter.empty()) + variant_filter.resize_fill(variants[discr]->size(), 1); + variant_filter[offsets_data[i]] = 0; + discr = NULL_DISCRIMINATOR; + } + else + { + offsets_data[i] = variant_new_sizes[discr]++; + } + } + } + + for (size_t i = 0; i != variants.size(); ++i) + { + if (!variant_filters[i].empty()) + variants[i] = variants[i]->filter(variant_filters[i], variant_new_sizes[i]); + } +} + +} diff --git a/src/Columns/ColumnVariant.h b/src/Columns/ColumnVariant.h new file mode 100644 index 00000000000..692fdd1709e --- /dev/null +++ b/src/Columns/ColumnVariant.h @@ -0,0 +1,306 @@ +#pragma once + +#include +#include + + +namespace DB +{ + +namespace ErrorCodes +{ + extern const int LOGICAL_ERROR; +} + +/** + * Column for storing Variant(...) type values. + * Variant type represents a union of other data types. + * For example, type Variant(T1, T2, ..., TN) means that each row of this type + * has a value of either type T1 or T2 or ... or TN or none of them (NULL value) + * + * ColumnVariant stores: + * - The discriminators column, which determines which variant is stored in each row. + * - The offsets column, which determines the offset in the corresponding variant column in each row. + * - The list of variant columns with only real values (so the sizes of variant columns can be different). + * Discriminator is an index of a variant in the variants list, it also has special value called NULL_DISCRIMINATOR + * that indicates that the value in the row is NULL. 
+ * + * We want to be able to extend Variant column for free without rewriting the data, but as we don't care about the + * order of variants during Variant creation (we want Variant(T1, T2) to be the same as Variant(T2, T1)), we support + * some global order of nested types inside Variant during type creation, so after extension the order of variant types + * (and so their discriminators) can change. For example: Variant(T1, T3) -> Variant(T1, T2, T3). + * To avoid full rewrite of discriminators column on Variant extension, we differentiate local order of variants + * inside a column and global order of variants created during type creation. So, ColumnVariant stores only local + * discriminators and additionally stores the mapping between global and local discriminators. + * So, when we need to extend Variant column with new variant, we can just append it to a list of variant columns + * with new local discriminator and update mapping from global to local orders. + * + * Note that two instances of ColumnVariant can have different local orders, so we should always use global + * discriminators during inter-column interactions. + * + * Let's take an example with type Variant(UInt32, String, Array(UInt32)): + * During type creation we will sort types by their names and get the global order: Array(UInt32), String, UInt32. + * So, type Array(UInt32) will have global discriminator 0, String - 1 and UInt32 - 2. + * Let's say we have a column with local order (String, UInt32, Array(UInt32)) and values: + * 'Hello', 42, NULL, 'World', 43, [1, 2, 3], NULL, 44 + * + * Let's see how these values will be stored in ColumnVariant: + * + * local_to_global_discriminators: {0 : 1, 1 : 2, 2 : 0} + * global_to_local_discriminators: {0 : 2, 1 : 0, 2 : 1} + * local_discriminators offsets String UInt32 Array(UInt32) + * 0 0 'Hello' 42 [1, 2, 3] + * 1 0 'World' 43 + * NULL_DISCRIMINATOR 0 44 + * 0 1 + * 1 1 + * 2 0 + * NULL_DISCRIMINATOR 0 + * 1 2 + * + */ +class ColumnVariant final : public COWHelper +{ +public: + using Discriminator = UInt8; + using Discriminators = PaddedPODArray; + using ColumnDiscriminators = ColumnVector; + using ColumnOffsets = ColumnVector; + + static constexpr UInt8 NULL_DISCRIMINATOR = std::numeric_limits::max(); /// 255 + static constexpr size_t MAX_NESTED_COLUMNS = std::numeric_limits::max(); /// 255 + +private: + friend class COWHelper; + + using NestedColumns = std::vector; + + /// Create an empty column with provided variants. + /// Variants are in global order. + explicit ColumnVariant(MutableColumns && variants_); + /// Variants are in local order according to provided mapping. + explicit ColumnVariant(MutableColumns && variants_, const std::vector & local_to_global_discriminators_); + + /// Create column from discriminators column and list of variant columns. + /// Offsets column should be constructed according to the discriminators. + /// Variants are in global order. + ColumnVariant(MutableColumnPtr local_discriminators_, MutableColumns && variants_); + /// Variants are in local order according to provided mapping. + ColumnVariant(MutableColumnPtr local_discriminators_, MutableColumns && variants_, const std::vector & local_to_global_discriminators_); + + /// Create column from discriminators column, offsets column and list of variant columns. + /// Variants are in global order. + ColumnVariant(MutableColumnPtr local_discriminators_, MutableColumnPtr offsets_, MutableColumns && variants_); + /// Variants are in local order according to provided mapping. 
+ ColumnVariant(MutableColumnPtr local_discriminators_, MutableColumnPtr offsets_, MutableColumns && variants_, const std::vector & local_to_global_discriminators_); + + ColumnVariant(const ColumnVariant &) = default; + +public: + /** Create immutable column using immutable arguments. This arguments may be shared with other variants. + * Use IColumn::mutate in order to make mutable column and mutate shared nested variants. + */ + using Base = COWHelper; + static Ptr create(const Columns & variants_) { return create(variants_, {}); } + static Ptr create(const Columns & variants_, const std::vector & local_to_global_discriminators_); + static Ptr create(const ColumnPtr & local_discriminators_, const Columns & variants_) { return create(local_discriminators_, variants_, {}); } + static Ptr create(const ColumnPtr & local_discriminators_, const Columns & variants_, const std::vector & local_to_global_discriminators_); + static Ptr create(const ColumnPtr & local_discriminators_, const DB::ColumnPtr & offsets_, const Columns & variants_) { return create(local_discriminators_, offsets_, variants_, {}); } + static Ptr create(const ColumnPtr & local_discriminators_, const DB::ColumnPtr & offsets_, const Columns & variants_, const std::vector & local_to_global_discriminators_); + + static MutablePtr create(MutableColumns && variants_) + { + return Base::create(std::move(variants_)); + } + + static MutablePtr create(MutableColumns && variants_, const std::vector & local_to_global_discriminators_) + { + return Base::create(std::move(variants_), local_to_global_discriminators_); + } + + static MutablePtr create(MutableColumnPtr local_discriminators_, MutableColumns && variants_) + { + return Base::create(std::move(local_discriminators_), std::move(variants_)); + } + + static MutablePtr create(MutableColumnPtr local_discriminators_, MutableColumns && variants_, const std::vector & local_to_global_discriminators_) + { + return Base::create(std::move(local_discriminators_), std::move(variants_), local_to_global_discriminators_); + } + + static MutablePtr create(MutableColumnPtr local_discriminators_, MutableColumnPtr offsets_, MutableColumns && variants_) + { + return Base::create(std::move(local_discriminators_), std::move(offsets_), std::move(variants_)); + } + + static MutablePtr create(MutableColumnPtr local_discriminators_, MutableColumnPtr offsets_, MutableColumns && variants_, const std::vector & local_to_global_discriminators_) + { + return Base::create(std::move(local_discriminators_), std::move(offsets_), std::move(variants_), local_to_global_discriminators_); + } + + std::string getName() const override; + const char * getFamilyName() const override { return "Variant"; } + TypeIndex getDataType() const override { return TypeIndex::Variant; } + + MutableColumnPtr cloneEmpty() const override; + MutableColumnPtr cloneResized(size_t size) const override; + + size_t ALWAYS_INLINE offsetAt(size_t i) const { return getOffsets()[i]; } + Discriminator ALWAYS_INLINE localDiscriminatorAt(size_t i) const { return getLocalDiscriminators()[i]; } + Discriminator ALWAYS_INLINE globalDiscriminatorAt(size_t i) const { return globalDiscriminatorByLocal(getLocalDiscriminators()[i]); } + + Discriminator ALWAYS_INLINE globalDiscriminatorByLocal(Discriminator local_discr) const + { + /// NULL_DISCRIMINATOR is always the same in local and global orders. + return local_discr == NULL_DISCRIMINATOR ? 
NULL_DISCRIMINATOR : local_to_global_discriminators[local_discr]; + } + + Discriminator ALWAYS_INLINE localDiscriminatorByGlobal(Discriminator global_discr) const + { + /// NULL_DISCRIMINATOR is always the same in local and global orders. + return global_discr == NULL_DISCRIMINATOR ? NULL_DISCRIMINATOR : global_to_local_discriminators[global_discr]; + } + + size_t size() const override + { + return local_discriminators->size(); + } + + Field operator[](size_t n) const override; + void get(size_t n, Field & res) const override; + + bool isDefaultAt(size_t n) const override; + bool isNullAt(size_t n) const override; + StringRef getDataAt(size_t n) const override; + void insertData(const char * pos, size_t length) override; + void insert(const Field & x) override; + void insertFrom(const IColumn & src_, size_t n) override; + void insertRangeFrom(const IColumn & src, size_t start, size_t length) override; + void insertManyFrom(const IColumn & src, size_t position, size_t length) override; + void insertDefault() override; + void insertManyDefaults(size_t length) override; + void popBack(size_t n) override; + StringRef serializeValueIntoArena(size_t n, Arena & arena, char const *& begin, const UInt8 *) const override; + const char * deserializeAndInsertFromArena(const char * pos) override; + const char * skipSerializedInArena(const char * pos) const override; + void updateHashWithValue(size_t n, SipHash & hash) const override; + void updateWeakHash32(WeakHash32 & hash) const override; + void updateHashFast(SipHash & hash) const override; + ColumnPtr filter(const Filter & filt, ssize_t result_size_hint) const override; + void expand(const Filter & mask, bool inverted) override; + ColumnPtr permute(const Permutation & perm, size_t limit) const override; + ColumnPtr index(const IColumn & indexes, size_t limit) const override; + template + ColumnPtr indexImpl(const PaddedPODArray & indexes, size_t limit) const; + ColumnPtr replicate(const Offsets & replicate_offsets) const override; + MutableColumns scatter(ColumnIndex num_variants, const Selector & selector) const override; + void gather(ColumnGathererStream & gatherer_stream) override; + + /// Variant type is not comparable. 
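+    /// As a consequence, compareAt() below reports every pair of rows as equal and getPermutation()
+    /// returns the identity permutation, so ordering operations keep Variant rows in their original order.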
+    int compareAt(size_t, size_t, const IColumn &, int) const override
+    {
+        return 0;
+    }
+
+    void compareColumn(const IColumn &, size_t, PaddedPODArray *, PaddedPODArray &, int, int) const override
+    {
+        throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method compareColumn is not supported for ColumnVariant");
+    }
+
+    bool hasEqualValues() const override;
+    void getExtremes(Field & min, Field & max) const override;
+    void getPermutation(IColumn::PermutationSortDirection direction, IColumn::PermutationSortStability stability,
+                    size_t limit, int nan_direction_hint, IColumn::Permutation & res) const override;
+    void updatePermutation(IColumn::PermutationSortDirection direction, IColumn::PermutationSortStability stability,
+                    size_t limit, int nan_direction_hint, IColumn::Permutation & res, EqualRanges & equal_ranges) const override;
+
+    void reserve(size_t n) override;
+    void ensureOwnership() override;
+    size_t byteSize() const override;
+    size_t byteSizeAt(size_t n) const override;
+    size_t allocatedBytes() const override;
+    void protect() override;
+    void forEachSubcolumn(MutableColumnCallback callback) override;
+    void forEachSubcolumnRecursively(RecursiveMutableColumnCallback callback) override;
+    bool structureEquals(const IColumn & rhs) const override;
+    ColumnPtr compress() const override;
+    double getRatioOfDefaultRows(double sample_ratio) const override;
+    UInt64 getNumberOfDefaultRows() const override;
+    void getIndicesOfNonDefaultRows(Offsets & indices, size_t from, size_t limit) const override;
+    void finalize() override;
+    bool isFinalized() const override;
+
+    const IColumn & getVariantByLocalDiscriminator(size_t discr) const { return *variants[discr]; }
+    const IColumn & getVariantByGlobalDiscriminator(size_t discr) const { return *variants[global_to_local_discriminators.at(discr)]; }
+    IColumn & getVariantByLocalDiscriminator(size_t discr) { return *variants[discr]; }
+    IColumn & getVariantByGlobalDiscriminator(size_t discr) { return *variants[global_to_local_discriminators.at(discr)]; }
+
+    const ColumnPtr & getVariantPtrByLocalDiscriminator(size_t discr) const { return variants[discr]; }
+    const ColumnPtr & getVariantPtrByGlobalDiscriminator(size_t discr) const { return variants[global_to_local_discriminators.at(discr)]; }
+    ColumnPtr & getVariantPtrByLocalDiscriminator(size_t discr) { return variants[discr]; }
+    ColumnPtr & getVariantPtrByGlobalDiscriminator(size_t discr) { return variants[global_to_local_discriminators.at(discr)]; }
+
+    const IColumn & getLocalDiscriminatorsColumn() const { return *local_discriminators; }
+    IColumn & getLocalDiscriminatorsColumn() { return *local_discriminators; }
+
+    const ColumnPtr & getLocalDiscriminatorsPtr() const { return local_discriminators; }
+    ColumnPtr & getLocalDiscriminatorsPtr() { return local_discriminators; }
+
+    const Discriminators & ALWAYS_INLINE getLocalDiscriminators() const { return assert_cast(*local_discriminators).getData(); }
+    Discriminators & ALWAYS_INLINE getLocalDiscriminators() { return assert_cast(*local_discriminators).getData(); }
+
+    const IColumn & getOffsetsColumn() const { return *offsets; }
+    IColumn & getOffsetsColumn() { return *offsets; }
+
+    const ColumnPtr & getOffsetsPtr() const { return offsets; }
+    ColumnPtr & getOffsetsPtr() { return offsets; }
+
+    const Offsets & ALWAYS_INLINE getOffsets() const { return assert_cast(*offsets).getData(); }
+    Offsets & ALWAYS_INLINE getOffsets() { return assert_cast(*offsets).getData(); }
+
+    size_t getNumVariants() const { return variants.size(); }
+
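+    /// Minimal usage sketch for the accessors above (illustrative only, not part of the original header):
+    ///     Field value;
+    ///     auto local_discr = column.localDiscriminatorAt(n);
+    ///     if (local_discr == ColumnVariant::NULL_DISCRIMINATOR)
+    ///         value = Null();
+    ///     else
+    ///         value = column.getVariantByLocalDiscriminator(local_discr)[column.offsetAt(n)];
+    /// This mirrors what operator[](n) returns: the value of the active variant, or Null for NULL rows.
+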
+ bool hasOnlyNulls() const + { + /// If all variants are empty, we have only NULL values. + return std::all_of(variants.begin(), variants.end(), [](const auto & v){ return v->empty(); } ); + } + + /// Check if local and global order is the same. + bool hasGlobalVariantsOrder() const + { + for (size_t i = 0; i != local_to_global_discriminators.size(); ++i) + { + if (local_to_global_discriminators[i] != i) + return false; + } + + return true; + } + + /// Check if we have only 1 non-empty variant and no NULL values, + /// and if so, return the discriminator of this non-empty column. + std::optional getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls() const; + + /// Apply null map to a Variant column. + /// Replace corresponding discriminators with NULL_DISCRIMINATOR + /// and filter out rows in variants if needed. + void applyNullMap(const ColumnVector::Container & null_map); + void applyNegatedNullMap(const ColumnVector::Container & null_map); + +private: + void initIdentityGlobalToLocalDiscriminatorsMapping(); + + template + void applyNullMapImpl(const ColumnVector::Container & null_map); + + WrappedPtr local_discriminators; + WrappedPtr offsets; + NestedColumns variants; + + std::vector global_to_local_discriminators; + std::vector local_to_global_discriminators; +}; + + +} diff --git a/src/Columns/IColumn.cpp b/src/Columns/IColumn.cpp index 7923bca6354..82dc82e0bd9 100644 --- a/src/Columns/IColumn.cpp +++ b/src/Columns/IColumn.cpp @@ -2,6 +2,7 @@ #include #include #include +#include #include #include #include @@ -83,6 +84,11 @@ bool isColumnNullable(const IColumn & column) return checkColumn(column); } +bool isColumnNullableOrLowCardinalityNullable(const IColumn & column) +{ + return isColumnNullable(column) || isColumnLowCardinalityNullable(column); +} + bool isColumnConst(const IColumn & column) { return checkColumn(column); diff --git a/src/Columns/IColumn.h b/src/Columns/IColumn.h index f012eeca61f..0dcba5b310c 100644 --- a/src/Columns/IColumn.h +++ b/src/Columns/IColumn.h @@ -631,6 +631,17 @@ struct IsMutableColumns template <> struct IsMutableColumns<> { static const bool value = true; }; +template +struct IsMutableColumnsOrRvalueReferences; + +template +struct IsMutableColumnsOrRvalueReferences +{ + static const bool value = (std::is_assignable::value || std::is_rvalue_reference_v) && IsMutableColumnsOrRvalueReferences::value; +}; + +template <> +struct IsMutableColumnsOrRvalueReferences<> { static const bool value = true; }; template const Type * checkAndGetColumn(const IColumn & column) @@ -662,4 +673,7 @@ bool isColumnConst(const IColumn & column); /// True if column's an ColumnNullable instance. It's just a syntax sugar for type check. bool isColumnNullable(const IColumn & column); +/// True if column's is ColumnNullable or ColumnLowCardinality with nullable nested column. 
+bool isColumnNullableOrLowCardinalityNullable(const IColumn & column); + } diff --git a/src/Columns/MaskOperations.cpp b/src/Columns/MaskOperations.cpp index b84268356a7..518269e1728 100644 --- a/src/Columns/MaskOperations.cpp +++ b/src/Columns/MaskOperations.cpp @@ -17,7 +17,7 @@ namespace ErrorCodes } template -void expandDataByMask(PaddedPODArray & data, const PaddedPODArray & mask, bool inverted) +void expandDataByMask(PaddedPODArray & data, const PaddedPODArray & mask, bool inverted, T default_value) { if (mask.size() < data.size()) throw Exception(ErrorCodes::LOGICAL_ERROR, "Mask size should be no less than data size."); @@ -38,7 +38,7 @@ void expandDataByMask(PaddedPODArray & data, const PaddedPODArray & ma --from; } else - data[index] = T(); + data[index] = default_value; --index; } @@ -49,7 +49,7 @@ void expandDataByMask(PaddedPODArray & data, const PaddedPODArray & ma /// Explicit instantiations - not to place the implementation of the function above in the header file. #define INSTANTIATE(TYPE) \ -template void expandDataByMask(PaddedPODArray &, const PaddedPODArray &, bool); +template void expandDataByMask(PaddedPODArray &, const PaddedPODArray &, bool, TYPE); INSTANTIATE(UInt8) INSTANTIATE(UInt16) diff --git a/src/Columns/MaskOperations.h b/src/Columns/MaskOperations.h index e43b4588258..cc5226bf0c1 100644 --- a/src/Columns/MaskOperations.h +++ b/src/Columns/MaskOperations.h @@ -13,7 +13,7 @@ namespace DB /// If inverted is true, we will work with inverted mask. This function is used in implementations of /// expand() method in IColumn interface. template -void expandDataByMask(PaddedPODArray & data, const PaddedPODArray & mask, bool inverted); +void expandDataByMask(PaddedPODArray & data, const PaddedPODArray & mask, bool inverted, T default_value = T()); struct MaskInfo { diff --git a/src/Columns/tests/gtest_column_variant.cpp b/src/Columns/tests/gtest_column_variant.cpp new file mode 100644 index 00000000000..b701e2d3183 --- /dev/null +++ b/src/Columns/tests/gtest_column_variant.cpp @@ -0,0 +1,688 @@ +#include +#include +#include +#include +#include + +using namespace DB; + +TEST(ColumnVariant, CreateFromEmptyColumns) +{ + MutableColumns columns; + columns.push_back(ColumnUInt32::create()); + columns.push_back(ColumnString::create()); + auto column = ColumnVariant::create(std::move(columns)); + ASSERT_TRUE(column->empty() && column->getLocalDiscriminators().empty() && column->getOffsets().empty()); +} + +TEST(ColumnVariant, CreateFromEmptyColumnsWithLocalOrder) +{ + MutableColumns columns; + columns.push_back(ColumnUInt32::create()); + columns.push_back(ColumnString::create()); + std::vector local_to_global_discriminators; + local_to_global_discriminators.push_back(1); + local_to_global_discriminators.push_back(0); + auto column = ColumnVariant::create(std::move(columns), local_to_global_discriminators); + ASSERT_TRUE(column->empty() && column->getLocalDiscriminators().empty() && column->getOffsets().empty()); + ASSERT_EQ(column->localDiscriminatorByGlobal(0), 0); + ASSERT_EQ(column->localDiscriminatorByGlobal(1), 1); + ASSERT_EQ(column->globalDiscriminatorByLocal(0), 0); + ASSERT_EQ(column->globalDiscriminatorByLocal(1), 1); +} + +MutableColumns createColumns1() +{ + MutableColumns columns; + auto column1 = ColumnUInt64::create(); + column1->insertValue(42); + columns.push_back(std::move(column1)); + auto column2 = ColumnString::create(); + column2->insertData("Hello", 5); + column2->insertData("World", 5); + columns.push_back(std::move(column2)); + auto column3 = 
ColumnUInt32::create(); + columns.push_back(std::move(column3)); + return columns; +} + +MutableColumnPtr createDiscriminators1() +{ + auto discriminators_column = ColumnVariant::ColumnDiscriminators::create(); + discriminators_column->insertValue(0); + discriminators_column->insertValue(1); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + discriminators_column->insertValue(1); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + return discriminators_column; +} + +void reorderColumns(const std::vector & local_to_global_order, MutableColumns & columns) +{ + MutableColumns res; + for (auto global_discr : local_to_global_order) + res.push_back(std::move(columns[global_discr])); + columns = std::move(res); +} + +template +void reorderDiscriminators(const std::vector & local_to_global_order, Ptr & discriminators) +{ + std::vector global_to_local_order(local_to_global_order.size()); + for (size_t i = 0; i != local_to_global_order.size(); ++i) + global_to_local_order[local_to_global_order[i]] = i; + + auto & discriminators_data = assert_cast(discriminators.get())->getData(); + for (auto & discr : discriminators_data) + { + if (discr != ColumnVariant::NULL_DISCRIMINATOR) + discr = global_to_local_order[discr]; + } +} + +MutableColumnPtr createOffsets1() +{ + auto offsets = ColumnVariant::ColumnOffsets::create(); + offsets->insertValue(0); + offsets->insertValue(0); + offsets->insertValue(0); + offsets->insertValue(1); + offsets->insertValue(0); + return offsets; +} + +std::vector createLocalToGlobalOrder1() +{ + std::vector local_to_global_discriminators; + local_to_global_discriminators.push_back(1); + local_to_global_discriminators.push_back(2); + local_to_global_discriminators.push_back(0); + return local_to_global_discriminators; +} + +void checkColumnVariant1(ColumnVariant * column) +{ + const auto & offsets = column->getOffsets(); + ASSERT_EQ(column->size(), 5); + ASSERT_EQ(offsets[0], 0); + ASSERT_EQ(offsets[1], 0); + ASSERT_EQ(offsets[3], 1); + ASSERT_TRUE(column->isDefaultAt(2) && column->isDefaultAt(4)); + ASSERT_EQ((*column)[0].get(), 42); + ASSERT_EQ((*column)[1].get(), "Hello"); + ASSERT_TRUE((*column)[2].isNull()); + ASSERT_EQ((*column)[3].get(), "World"); + ASSERT_TRUE((*column)[4].isNull()); +} + +void checkColumnVariant1Order(ColumnVariant * column) +{ + ASSERT_EQ(column->localDiscriminatorByGlobal(0), 2); + ASSERT_EQ(column->localDiscriminatorByGlobal(1), 0); + ASSERT_EQ(column->localDiscriminatorByGlobal(2), 1); + ASSERT_EQ(column->globalDiscriminatorByLocal(0), 1); + ASSERT_EQ(column->globalDiscriminatorByLocal(1), 2); + ASSERT_EQ(column->globalDiscriminatorByLocal(2), 0); + ASSERT_EQ(column->localDiscriminatorAt(0), 2); + ASSERT_EQ(column->localDiscriminatorAt(1), 0); + ASSERT_EQ(column->localDiscriminatorAt(2), ColumnVariant::NULL_DISCRIMINATOR); + ASSERT_EQ(column->localDiscriminatorAt(3), 0); + ASSERT_EQ(column->localDiscriminatorAt(4), ColumnVariant::NULL_DISCRIMINATOR); + ASSERT_EQ(column->globalDiscriminatorAt(0), 0); + ASSERT_EQ(column->globalDiscriminatorAt(1), 1); + ASSERT_EQ(column->globalDiscriminatorAt(2), ColumnVariant::NULL_DISCRIMINATOR); + ASSERT_EQ(column->globalDiscriminatorAt(3), 1); + ASSERT_EQ(column->globalDiscriminatorAt(4), ColumnVariant::NULL_DISCRIMINATOR); +} + +TEST(ColumnVariant, CreateFromDiscriminatorsAndColumns) +{ + auto columns = createColumns1(); + auto discriminators = createDiscriminators1(); + auto column = ColumnVariant::create(std::move(discriminators), std::move(columns)); + 
checkColumnVariant1(column.get()); +} + +TEST(ColumnVariant, CreateFromDiscriminatorsAndColumnsWithLocalOrder) +{ + auto local_to_global_order = createLocalToGlobalOrder1(); + auto columns = createColumns1(); + reorderColumns(local_to_global_order, columns); + auto discriminators = createDiscriminators1(); + reorderDiscriminators(local_to_global_order, discriminators); + auto column = ColumnVariant::create(std::move(discriminators), std::move(columns), createLocalToGlobalOrder1()); + checkColumnVariant1(column.get()); + checkColumnVariant1Order(column.get()); +} + +TEST(ColumnVariant, CreateFromDiscriminatorsOffsetsAndColumns) +{ + auto columns = createColumns1(); + auto discriminators = createDiscriminators1(); + auto offsets = createOffsets1(); + auto column = ColumnVariant::create(std::move(discriminators), std::move(offsets), std::move(columns)); + checkColumnVariant1(column.get()); +} + +TEST(ColumnVariant, CreateFromDiscriminatorsOffsetsAndColumnsWithLocalOrder) +{ + auto local_to_global_order = createLocalToGlobalOrder1(); + auto columns = createColumns1(); + reorderColumns(local_to_global_order, columns); + auto discriminators = createDiscriminators1(); + reorderDiscriminators(local_to_global_order, discriminators); + auto offsets = createOffsets1(); + auto column = ColumnVariant::create(std::move(discriminators), std::move(offsets), std::move(columns), createLocalToGlobalOrder1()); + checkColumnVariant1(column.get()); + checkColumnVariant1Order(column.get()); +} + +ColumnVariant::MutablePtr createVariantWithOneFullColumNoNulls(size_t size, bool change_order) +{ + MutableColumns columns; + auto column1 = ColumnUInt64::create(); + for (size_t i = 0; i != size; ++i) + column1->insertValue(i); + columns.push_back(std::move(column1)); + auto column2 = ColumnString::create(); + columns.push_back(std::move(column2)); + auto column3 = ColumnUInt32::create(); + columns.push_back(std::move(column3)); + auto discriminators_column = ColumnVariant::ColumnDiscriminators::create(); + for (size_t i = 0; i != size; ++i) + discriminators_column->insertValue(0); + if (change_order) + { + auto local_to_global_order = createLocalToGlobalOrder1(); + reorderColumns(local_to_global_order, columns); + reorderDiscriminators(local_to_global_order, discriminators_column); + return ColumnVariant::create(std::move(discriminators_column), std::move(columns), createLocalToGlobalOrder1()); + } + return ColumnVariant::create(std::move(discriminators_column), std::move(columns)); +} + +TEST(ColumnVariant, CreateFromDiscriminatorsAndOneFullColumnNoNulls) +{ + auto column = createVariantWithOneFullColumNoNulls(3, false); + const auto & offsets = column->getOffsets(); + ASSERT_EQ(column->size(), 3); + ASSERT_EQ(offsets[0], 0); + ASSERT_EQ(offsets[1], 1); + ASSERT_EQ(offsets[2], 2); + ASSERT_EQ((*column)[0].get(), 0); + ASSERT_EQ((*column)[1].get(), 1); + ASSERT_EQ((*column)[2].get(), 2); +} + +TEST(ColumnVariant, CreateFromDiscriminatorsAndOneFullColumnNoNullsWithLocalOrder) +{ + auto column = createVariantWithOneFullColumNoNulls(3, true); + const auto & offsets = column->getOffsets(); + ASSERT_EQ(column->size(), 3); + ASSERT_EQ(offsets[0], 0); + ASSERT_EQ(offsets[1], 1); + ASSERT_EQ(offsets[2], 2); + ASSERT_EQ((*column)[0].get(), 0); + ASSERT_EQ((*column)[1].get(), 1); + ASSERT_EQ((*column)[2].get(), 2); + ASSERT_EQ(column->localDiscriminatorAt(0), 2); + ASSERT_EQ(column->localDiscriminatorAt(1), 2); + ASSERT_EQ(column->localDiscriminatorAt(2), 2); + ASSERT_EQ(column->globalDiscriminatorAt(0), 0); + 
ASSERT_EQ(column->globalDiscriminatorAt(0), 0); + ASSERT_EQ(column->globalDiscriminatorAt(0), 0); +} + +TEST(ColumnVariant, CloneResizedToEmpty) +{ + auto column = ColumnVariant::create(createDiscriminators1(), createOffsets1(), createColumns1()); + auto resized_column = column->cloneResized(0); + ASSERT_TRUE(resized_column->empty()); +} + +TEST(ColumnVariant, CloneResizedToLarge) +{ + auto column = ColumnVariant::create(createDiscriminators1(), createOffsets1(), createColumns1()); + auto resized_column = column->cloneResized(7); + const auto * resized_column_variant = assert_cast(resized_column.get()); + ASSERT_EQ(resized_column_variant->size(), 7); + const auto & offsets = resized_column_variant->getOffsets(); + for (size_t i = 0; i != 7; ++i) + { + if (i == 3) + ASSERT_EQ(offsets[i], 1); + else + ASSERT_EQ(offsets[i], 0); + } + + const auto & discriminators = resized_column_variant->getLocalDiscriminators(); + std::vector null_indexes = {2, 4, 5, 6}; + for (size_t i : null_indexes) + ASSERT_EQ(discriminators[i], ColumnVariant::NULL_DISCRIMINATOR); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(0).size(), 1); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(1).size(), 2); +} + +TEST(ColumnVariant, CloneResizedWithOneFullColumnNoNulls) +{ + auto column = createVariantWithOneFullColumNoNulls(5, false); + auto resized_column = column->cloneResized(3); + const auto * resized_column_variant = assert_cast(resized_column.get()); + ASSERT_EQ(resized_column_variant->size(), 3); + const auto & offsets = resized_column_variant->getOffsets(); + for (size_t i = 0; i != 3; ++i) + ASSERT_EQ(offsets[i], i); + const auto & discriminators = resized_column_variant->getLocalDiscriminators(); + for (size_t i = 0; i != 3; ++i) + ASSERT_EQ(discriminators[i], 0); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(0).size(), 3); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(1).size(), 0); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(2).size(), 0); +} + +MutableColumns createColumns2() +{ + MutableColumns columns; + auto column1 = ColumnUInt64::create(); + column1->insertValue(42); + column1->insertValue(43); + column1->insertValue(44); + columns.push_back(std::move(column1)); + auto column2 = ColumnString::create(); + column2->insertData("Hello", 5); + column2->insertData("World", 5); + columns.push_back(std::move(column2)); + auto column3 = ColumnUInt8::create(); + columns.push_back(std::move(column3)); + return columns; +} + +TEST(ColumnVariant, CloneResizedGeneral1) +{ + /// D c1 c2 c3 + /// 0 42 Hello + /// 1 43 World + /// NULL 44 + /// 0 + /// 1 + /// NULL + /// 0 + auto discriminators_column = ColumnVariant::ColumnDiscriminators::create(); + discriminators_column->insertValue(0); + discriminators_column->insertValue(1); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + discriminators_column->insertValue(0); + discriminators_column->insertValue(1); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + discriminators_column->insertValue(0); + auto column = ColumnVariant::create(std::move(discriminators_column), createColumns2()); + auto resized_column = column->cloneResized(4); + const auto * resized_column_variant = assert_cast(resized_column.get()); + ASSERT_EQ(resized_column_variant->size(), 4); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(0).size(), 2); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(1).size(), 1); + 
ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(2).size(), 0); + const auto & discriminators = resized_column_variant->getLocalDiscriminators(); + ASSERT_EQ(discriminators[0], 0); + ASSERT_EQ(discriminators[1], 1); + ASSERT_EQ(discriminators[2], ColumnVariant::NULL_DISCRIMINATOR); + ASSERT_EQ(discriminators[3], 0); + const auto & offsets = resized_column_variant->getOffsets(); + ASSERT_EQ(offsets[0], 0); + ASSERT_EQ(offsets[1], 0); + ASSERT_EQ(offsets[3], 1); + ASSERT_EQ((*resized_column_variant)[0].get(), 42); + ASSERT_EQ((*resized_column_variant)[1].get(), "Hello"); + ASSERT_EQ((*resized_column_variant)[3].get(), 43); +} + +TEST(ColumnVariant, CloneResizedGeneral2) +{ + /// D c1 c2 c3 + /// 0 42 Hello + /// NULL 43 World + /// NULL 44 + /// 0 + /// 1 + /// 1 + /// 0 + auto discriminators_column = ColumnVariant::ColumnDiscriminators::create(); + discriminators_column->insertValue(0); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + discriminators_column->insertValue(0); + discriminators_column->insertValue(1); + discriminators_column->insertValue(1); + discriminators_column->insertValue(0); + auto column = ColumnVariant::create(std::move(discriminators_column), createColumns2()); + auto resized_column = column->cloneResized(3); + const auto * resized_column_variant = assert_cast(resized_column.get()); + ASSERT_EQ(resized_column_variant->size(), 3); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(0).size(), 1); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(1).size(), 0); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(2).size(), 0); + const auto & discriminators = resized_column_variant->getLocalDiscriminators(); + ASSERT_EQ(discriminators[0], 0); + ASSERT_EQ(discriminators[1], ColumnVariant::NULL_DISCRIMINATOR); + ASSERT_EQ(discriminators[2], ColumnVariant::NULL_DISCRIMINATOR); + const auto & offsets = resized_column_variant->getOffsets(); + ASSERT_EQ(offsets[0], 0); + ASSERT_EQ((*resized_column_variant)[0].get(), 42); +} + +TEST(ColumnVariant, CloneResizedGeneral3) +{ + /// D c1 c2 c3 + /// 0 42 Hello + /// 1 43 World + /// 1 44 + /// 0 + /// NULL + /// NULL + /// 0 + auto discriminators_column = ColumnVariant::ColumnDiscriminators::create(); + discriminators_column->insertValue(0); + discriminators_column->insertValue(1); + discriminators_column->insertValue(1); + discriminators_column->insertValue(0); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + discriminators_column->insertValue(0); + auto column = ColumnVariant::create(std::move(discriminators_column), createColumns2()); + auto resized_column = column->cloneResized(5); + const auto * resized_column_variant = assert_cast(resized_column.get()); + ASSERT_EQ(resized_column_variant->size(), 5); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(0).size(), 2); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(1).size(), 2); + ASSERT_EQ(resized_column_variant->getVariantByLocalDiscriminator(2).size(), 0); + const auto & discriminators = resized_column_variant->getLocalDiscriminators(); + ASSERT_EQ(discriminators[0], 0); + ASSERT_EQ(discriminators[1], 1); + ASSERT_EQ(discriminators[2], 1); + ASSERT_EQ(discriminators[3], 0); + const auto & offsets = resized_column_variant->getOffsets(); + ASSERT_EQ(offsets[0], 0); + ASSERT_EQ(offsets[1], 
0); + ASSERT_EQ(offsets[2], 1); + ASSERT_EQ(offsets[3], 1); + ASSERT_EQ((*resized_column_variant)[0].get(), 42); + ASSERT_EQ((*resized_column_variant)[1].get(), "Hello"); + ASSERT_EQ((*resized_column_variant)[2].get(), "World"); + ASSERT_EQ((*resized_column_variant)[3].get(), 43); +} + +MutableColumnPtr createDiscriminators2() +{ + auto discriminators_column = ColumnVariant::ColumnDiscriminators::create(); + discriminators_column->insertValue(0); + discriminators_column->insertValue(1); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + discriminators_column->insertValue(0); + discriminators_column->insertValue(1); + discriminators_column->insertValue(ColumnVariant::NULL_DISCRIMINATOR); + discriminators_column->insertValue(0); + return discriminators_column; +} + +std::vector createLocalToGlobalOrder2() +{ + std::vector local_to_global_discriminators; + local_to_global_discriminators.push_back(2); + local_to_global_discriminators.push_back(0); + local_to_global_discriminators.push_back(1); + return local_to_global_discriminators; +} + +ColumnVariant::MutablePtr createVariantColumn1(bool reorder) +{ + auto columns = createColumns1(); + auto discriminators = createDiscriminators1(); + if (!reorder) + return ColumnVariant::create(std::move(discriminators), std::move(columns)); + auto local_to_global_order = createLocalToGlobalOrder1(); + reorderColumns(local_to_global_order, columns); + reorderDiscriminators(local_to_global_order, discriminators); + return ColumnVariant::create(std::move(discriminators), std::move(columns), local_to_global_order); +} + +ColumnVariant::MutablePtr createVariantColumn2(bool reorder) +{ + auto columns = createColumns2(); + auto discriminators = createDiscriminators2(); + if (!reorder) + return ColumnVariant::create(std::move(discriminators), std::move(columns)); + auto local_to_global_order = createLocalToGlobalOrder2(); + reorderColumns(local_to_global_order, columns); + reorderDiscriminators(local_to_global_order, discriminators); + return ColumnVariant::create(std::move(discriminators), std::move(columns), local_to_global_order); +} + +TEST(ColumnVariant, InsertFrom) +{ + for (bool change_order : {false, true}) + { + auto column_to = createVariantColumn1(change_order); + auto column_from = createVariantColumn2(change_order); + column_to->insertFrom(*column_from, 3); + ASSERT_EQ(column_to->globalDiscriminatorAt(5), 0); + ASSERT_EQ((*column_to)[5].get(), 43); + } +} + +TEST(ColumnVariant, InsertRangeFromOneColumnNoNulls) +{ + for (bool change_order : {false, true}) + { + auto column_to = createVariantColumn2(change_order); + auto column_from = createVariantWithOneFullColumNoNulls(5, change_order); + column_to->insertRangeFrom(*column_from, 2, 2); + ASSERT_EQ(column_to->globalDiscriminatorAt(7), 0); + ASSERT_EQ(column_to->globalDiscriminatorAt(8), 0); + ASSERT_EQ((*column_to)[7].get(), 2); + ASSERT_EQ((*column_to)[8].get(), 3); + } +} + +TEST(ColumnVariant, InsertRangeFromGeneral) +{ + for (bool change_order : {false, true}) + { + auto column_to = createVariantColumn1(change_order); + auto column_from = createVariantColumn2(change_order); + column_to->insertRangeFrom(*column_from, 1, 4); + ASSERT_EQ(column_to->globalDiscriminatorAt(5), 1); + ASSERT_EQ(column_to->globalDiscriminatorAt(6), ColumnVariant::NULL_DISCRIMINATOR); + ASSERT_EQ(column_to->globalDiscriminatorAt(7), 0); + ASSERT_EQ(column_to->globalDiscriminatorAt(8), 1); + ASSERT_EQ((*column_to)[5].get(), "Hello"); + ASSERT_EQ((*column_to)[7].get(), 43); + 
ASSERT_EQ((*column_to)[8].get(), "World"); + } +} + +TEST(ColumnVariant, InsertManyFrom) +{ + for (bool change_order : {false, true}) + { + auto column_to = createVariantColumn1(change_order); + auto column_from = createVariantColumn2(change_order); + column_to->insertManyFrom(*column_from, 3, 2); + ASSERT_EQ(column_to->globalDiscriminatorAt(5), 0); + ASSERT_EQ(column_to->globalDiscriminatorAt(6), 0); + ASSERT_EQ((*column_to)[5].get(), 43); + ASSERT_EQ((*column_to)[6].get(), 43); + } +} + +TEST(ColumnVariant, PopBackOneColumnNoNulls) +{ + auto column = createVariantWithOneFullColumNoNulls(5, false); + column->popBack(3); + ASSERT_EQ(column->size(), 2); + ASSERT_EQ(column->getVariantByLocalDiscriminator(0).size(), 2); + ASSERT_EQ((*column)[0].get(), 0); + ASSERT_EQ((*column)[1].get(), 1); +} + +TEST(ColumnVariant, PopBackGeneral) +{ + auto column = ColumnVariant::create(createDiscriminators2(), createColumns2()); + column->popBack(4); + ASSERT_EQ(column->size(), 3); + ASSERT_EQ(column->getVariantByLocalDiscriminator(0).size(), 1); + ASSERT_EQ(column->getVariantByLocalDiscriminator(1).size(), 1); + ASSERT_EQ((*column)[0].get(), 42); + ASSERT_EQ((*column)[1].get(), "Hello"); + ASSERT_TRUE((*column)[2].isNull()); +} + +TEST(ColumnVariant, FilterOneColumnNoNulls) +{ + auto column = createVariantWithOneFullColumNoNulls(3, false); + IColumn::Filter filter; + filter.push_back(1); + filter.push_back(0); + filter.push_back(1); + auto filtered_column = column->filter(filter, -1); + ASSERT_EQ(filtered_column->size(), 2); + ASSERT_EQ((*filtered_column)[0].get(), 0); + ASSERT_EQ((*filtered_column)[1].get(), 2); +} + +TEST(ColumnVariant, FilterGeneral) +{ + auto column = ColumnVariant::create(createDiscriminators2(), createColumns2()); + IColumn::Filter filter; + filter.push_back(0); + filter.push_back(1); + filter.push_back(1); + filter.push_back(0); + filter.push_back(0); + filter.push_back(1); + filter.push_back(0); + auto filtered_column = column->filter(filter, -1); + ASSERT_EQ(filtered_column->size(), 3); + ASSERT_EQ((*filtered_column)[0].get(), "Hello"); + ASSERT_TRUE((*filtered_column)[1].isNull()); + ASSERT_TRUE((*filtered_column)[2].isNull()); +} + +TEST(ColumnVariant, PermuteAndIndexOneColumnNoNulls) +{ + auto column = createVariantWithOneFullColumNoNulls(4, false); + IColumn::Permutation permutation; + permutation.push_back(1); + permutation.push_back(3); + permutation.push_back(2); + permutation.push_back(0); + auto permuted_column = column->permute(permutation, 3); + ASSERT_EQ(permuted_column->size(), 3); + ASSERT_EQ((*permuted_column)[0].get(), 1); + ASSERT_EQ((*permuted_column)[1].get(), 3); + ASSERT_EQ((*permuted_column)[2].get(), 2); + + auto index = ColumnUInt64::create(); + index->getData() = std::move(permutation); + auto indexed_column = column->index(*index, 3); + ASSERT_EQ(indexed_column->size(), 3); + ASSERT_EQ((*indexed_column)[0].get(), 1); + ASSERT_EQ((*indexed_column)[1].get(), 3); + ASSERT_EQ((*indexed_column)[2].get(), 2); +} + +TEST(ColumnVariant, PermuteGeneral) +{ + auto column = ColumnVariant::create(createDiscriminators2(), createColumns2()); + IColumn::Permutation permutation; + permutation.push_back(3); + permutation.push_back(4); + permutation.push_back(1); + permutation.push_back(5); + auto permuted_column = column->permute(permutation, 4); + ASSERT_EQ(permuted_column->size(), 4); + ASSERT_EQ((*permuted_column)[0].get(), 43); + ASSERT_EQ((*permuted_column)[1].get(), "World"); + ASSERT_EQ((*permuted_column)[2].get(), "Hello"); + 
ASSERT_TRUE((*permuted_column)[3].isNull()); +} + +TEST(ColumnVariant, ReplicateOneColumnNoNull) +{ + auto column = createVariantWithOneFullColumNoNulls(3, false); + IColumn::Offsets offsets; + offsets.push_back(0); + offsets.push_back(3); + offsets.push_back(6); + auto replicated_column = column->replicate(offsets); + ASSERT_EQ(replicated_column->size(), 6); + ASSERT_EQ((*replicated_column)[0].get(), 1); + ASSERT_EQ((*replicated_column)[1].get(), 1); + ASSERT_EQ((*replicated_column)[2].get(), 1); + ASSERT_EQ((*replicated_column)[3].get(), 2); + ASSERT_EQ((*replicated_column)[4].get(), 2); + ASSERT_EQ((*replicated_column)[5].get(), 2); +} + +TEST(ColumnVariant, ReplicateGeneral) +{ + auto column = ColumnVariant::create(createDiscriminators1(), createColumns1()); + IColumn::Offsets offsets; + offsets.push_back(1); + offsets.push_back(3); + offsets.push_back(5); + offsets.push_back(5); + offsets.push_back(7); + auto replicated_column = column->replicate(offsets); + ASSERT_EQ(replicated_column->size(), 7); + ASSERT_EQ((*replicated_column)[0].get(), 42); + ASSERT_EQ((*replicated_column)[1].get(), "Hello"); + ASSERT_EQ((*replicated_column)[2].get(), "Hello"); + ASSERT_TRUE((*replicated_column)[3].isNull()); + ASSERT_TRUE((*replicated_column)[4].isNull()); + ASSERT_TRUE((*replicated_column)[5].isNull()); + ASSERT_TRUE((*replicated_column)[6].isNull()); +} + +TEST(ColumnVariant, ScatterOneColumnNoNulls) +{ + auto column = createVariantWithOneFullColumNoNulls(5, false); + IColumn::Selector selector; + selector.push_back(0); + selector.push_back(1); + selector.push_back(2); + selector.push_back(0); + selector.push_back(1); + auto columns = column->scatter(3, selector); + ASSERT_EQ(columns[0]->size(), 2); + ASSERT_EQ((*columns[0])[0].get(), 0); + ASSERT_EQ((*columns[0])[1].get(), 3); + ASSERT_EQ(columns[1]->size(), 2); + ASSERT_EQ((*columns[1])[0].get(), 1); + ASSERT_EQ((*columns[1])[1].get(), 4); + ASSERT_EQ(columns[2]->size(), 1); + ASSERT_EQ((*columns[2])[0].get(), 2); +} + +TEST(ColumnVariant, ScatterGeneral) +{ + auto column = ColumnVariant::create(createDiscriminators2(), createColumns2()); + IColumn::Selector selector; + selector.push_back(0); + selector.push_back(0); + selector.push_back(2); + selector.push_back(0); + selector.push_back(1); + selector.push_back(2); + selector.push_back(1); + auto columns = column->scatter(3, selector); + ASSERT_EQ(columns[0]->size(), 3); + ASSERT_EQ((*columns[0])[0].get(), 42); + ASSERT_EQ((*columns[0])[1].get(), "Hello"); + ASSERT_EQ((*columns[0])[2].get(), 43); + ASSERT_EQ(columns[1]->size(), 2); + ASSERT_EQ((*columns[1])[0].get(), "World"); + ASSERT_EQ((*columns[1])[1].get(), 44); + ASSERT_EQ(columns[2]->size(), 2); + ASSERT_TRUE((*columns[2])[0].isNull()); + ASSERT_TRUE((*columns[2])[1].isNull()); +} diff --git a/src/Core/Settings.h b/src/Core/Settings.h index 7e50a81ada8..0151dcb982d 100644 --- a/src/Core/Settings.h +++ b/src/Core/Settings.h @@ -816,6 +816,7 @@ class IColumn; M(Bool, function_json_value_return_type_allow_complex, false, "Allow function JSON_VALUE to return complex type, such as: struct, array, map.", 0) \ M(Bool, use_with_fill_by_sorting_prefix, true, "Columns preceding WITH FILL columns in ORDER BY clause form sorting prefix. 
Rows with different values in sorting prefix are filled independently", 0) \ M(Bool, optimize_uniq_to_count, true, "Rewrite uniq and its variants(except uniqUpTo) to count if subquery has distinct or group by clause.", 0) \ + M(Bool, use_variant_when_no_common_type_in_if, false, "Use Variant as a result type for if/multiIf in case when there is no common type for arguments", 0) \ \ /** Experimental functions */ \ M(Bool, allow_experimental_materialized_postgresql_table, false, "Allows to use the MaterializedPostgreSQL table engine. Disabled by default, because this feature is experimental", 0) \ @@ -823,6 +824,7 @@ class IColumn; M(Bool, allow_experimental_nlp_functions, false, "Enable experimental functions for natural language processing.", 0) \ M(Bool, allow_experimental_hash_functions, false, "Enable experimental hash functions", 0) \ M(Bool, allow_experimental_object_type, false, "Allow Object and JSON data types", 0) \ + M(Bool, allow_experimental_variant_type, false, "Allow Variant data type", 0) \ M(Bool, allow_experimental_annoy_index, false, "Allows to use Annoy index. Disabled by default because this feature is experimental", 0) \ M(Bool, allow_experimental_usearch_index, false, "Allows to use USearch index. Disabled by default because this feature is experimental", 0) \ M(UInt64, max_limit_for_ann_queries, 1'000'000, "SELECT queries with LIMIT bigger than this setting cannot use ANN indexes. Helps to prevent memory overflows in ANN search indexes.", 0) \ diff --git a/src/Core/TypeId.h b/src/Core/TypeId.h index 9c634d2321c..7003e880cd5 100644 --- a/src/Core/TypeId.h +++ b/src/Core/TypeId.h @@ -49,6 +49,7 @@ enum class TypeIndex IPv4, IPv6, JSONPaths, + Variant, }; /** diff --git a/src/DataTypes/DataTypeFactory.cpp b/src/DataTypes/DataTypeFactory.cpp index 415f24d8151..d154b386ace 100644 --- a/src/DataTypes/DataTypeFactory.cpp +++ b/src/DataTypes/DataTypeFactory.cpp @@ -290,6 +290,7 @@ DataTypeFactory::DataTypeFactory() registerDataTypeDomainGeo(*this); registerDataTypeMap(*this); registerDataTypeObject(*this); + registerDataTypeVariant(*this); } DataTypeFactory & DataTypeFactory::instance() diff --git a/src/DataTypes/DataTypeFactory.h b/src/DataTypes/DataTypeFactory.h index ba7c1a3d7fe..a2aeb6f3646 100644 --- a/src/DataTypes/DataTypeFactory.h +++ b/src/DataTypes/DataTypeFactory.h @@ -100,5 +100,6 @@ void registerDataTypeDomainBool(DataTypeFactory & factory); void registerDataTypeDomainSimpleAggregateFunction(DataTypeFactory & factory); void registerDataTypeDomainGeo(DataTypeFactory & factory); void registerDataTypeObject(DataTypeFactory & factory); +void registerDataTypeVariant(DataTypeFactory & factory); } diff --git a/src/DataTypes/DataTypeNullable.cpp b/src/DataTypes/DataTypeNullable.cpp index 41a9a1de543..484d779551f 100644 --- a/src/DataTypes/DataTypeNullable.cpp +++ b/src/DataTypes/DataTypeNullable.cpp @@ -114,5 +114,33 @@ DataTypePtr makeNullableOrLowCardinalityNullable(const DataTypePtr & type) return std::make_shared(type); } +DataTypePtr makeNullableOrLowCardinalityNullableSafe(const DataTypePtr & type) +{ + if (isNullableOrLowCardinalityNullable(type)) + return type; + + if (type->lowCardinality()) + { + const auto & dictionary_type = assert_cast(*type).getDictionaryType(); + return std::make_shared(makeNullable(dictionary_type)); + } + + return makeNullableSafe(type); +} + +DataTypePtr removeNullableOrLowCardinalityNullable(const DataTypePtr & type) +{ + if (type->isNullable()) + return static_cast(*type).getNestedType(); + + if (type->isLowCardinalityNullable()) + { 
+ auto dict_type = removeNullable(static_cast(*type).getDictionaryType()); + return std::make_shared(dict_type); + } + + return type; + +} } diff --git a/src/DataTypes/DataTypeNullable.h b/src/DataTypes/DataTypeNullable.h index 06d46fb15ed..7ad0e1ba5f1 100644 --- a/src/DataTypes/DataTypeNullable.h +++ b/src/DataTypes/DataTypeNullable.h @@ -54,5 +54,8 @@ DataTypePtr makeNullable(const DataTypePtr & type); DataTypePtr makeNullableSafe(const DataTypePtr & type); DataTypePtr removeNullable(const DataTypePtr & type); DataTypePtr makeNullableOrLowCardinalityNullable(const DataTypePtr & type); +DataTypePtr makeNullableOrLowCardinalityNullableSafe(const DataTypePtr & type); +/// Nullable(T) -> T, LowCardinality(Nullable(T)) -> T +DataTypePtr removeNullableOrLowCardinalityNullable(const DataTypePtr & type); } diff --git a/src/DataTypes/DataTypeTuple.cpp b/src/DataTypes/DataTypeTuple.cpp index fd2e5e6a784..df9af203618 100644 --- a/src/DataTypes/DataTypeTuple.cpp +++ b/src/DataTypes/DataTypeTuple.cpp @@ -11,6 +11,7 @@ #include #include #include +#include #include #include #include @@ -172,11 +173,15 @@ MutableColumnPtr DataTypeTuple::createColumn() const MutableColumnPtr DataTypeTuple::createColumn(const ISerialization & serialization) const { + /// If we read Tuple as Variant subcolumn, it may be wrapped to SerializationVariantElement. + /// Here we don't need it, so we drop this wrapper. + const auto * current_serialization = &serialization; + while (const auto * serialization_variant_element = typeid_cast(current_serialization)) + current_serialization = serialization_variant_element->getNested().get(); + /// If we read subcolumn of nested Tuple, it may be wrapped to SerializationNamed /// several times to allow to reconstruct the substream path name. /// Here we don't need substream path name, so we drop first several wrapper serializations. - - const auto * current_serialization = &serialization; while (const auto * serialization_named = typeid_cast(current_serialization)) current_serialization = serialization_named->getNested().get(); diff --git a/src/DataTypes/DataTypeVariant.cpp b/src/DataTypes/DataTypeVariant.cpp new file mode 100644 index 00000000000..77e1c504cf8 --- /dev/null +++ b/src/DataTypes/DataTypeVariant.cpp @@ -0,0 +1,197 @@ +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +namespace DB +{ + +namespace ErrorCodes +{ + extern const int BAD_ARGUMENTS; + extern const int EMPTY_DATA_PASSED; +} + + +DataTypeVariant::DataTypeVariant(const DataTypes & variants_) +{ + /// Sort nested types by their full names and squash identical types. + std::map name_to_type; + for (const auto & type : variants_) + { + /// Nullable(...), LowCardinality(Nullable(...)) and Variant(...) types are not allowed inside Variant type. + if (isNullableOrLowCardinalityNullable(type)) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Nullable/LowCardinality(Nullable) types are not allowed inside Variant type"); + if (type->getTypeId() == TypeIndex::Variant) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Nested Variant types are not allowed"); + /// Don't use Nothing type as a variant. 
+ if (!isNothing(type)) + name_to_type[type->getName()] = type; + } + + variants.reserve(name_to_type.size()); + for (const auto & [_, type] : name_to_type) + variants.push_back(type); + + if (variants.empty()) + throw Exception(ErrorCodes::EMPTY_DATA_PASSED, "Variant cannot be empty"); + + if (variants.size() > ColumnVariant::MAX_NESTED_COLUMNS) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Variant type with more than {} nested types is not allowed", ColumnVariant::MAX_NESTED_COLUMNS); +} + +std::string DataTypeVariant::doGetName() const +{ + size_t size = variants.size(); + WriteBufferFromOwnString s; + + s << "Variant("; + for (size_t i = 0; i < size; ++i) + { + if (i != 0) + s << ", "; + + s << variants[i]->getName(); + } + s << ")"; + + return s.str(); +} + +std::string DataTypeVariant::doGetPrettyName(size_t indent) const +{ + size_t size = variants.size(); + WriteBufferFromOwnString s; + s << "Variant(\n"; + + for (size_t i = 0; i != size; ++i) + { + if (i != 0) + s << ",\n"; + + s << fourSpaceIndent(indent + 1) << variants[i]->getPrettyName(indent + 1); + } + + s << '\n' << fourSpaceIndent(indent) << ')'; + return s.str(); +} + +MutableColumnPtr DataTypeVariant::createColumn() const +{ + size_t size = variants.size(); + MutableColumns nested_columns; + nested_columns.reserve(size); + for (size_t i = 0; i < size; ++i) + nested_columns.push_back(variants[i]->createColumn()); + + return ColumnVariant::create(std::move(nested_columns)); +} + + +Field DataTypeVariant::getDefault() const +{ + return Null(); +} + +bool DataTypeVariant::equals(const IDataType & rhs) const +{ + if (typeid(rhs) != typeid(*this)) + return false; + + const DataTypeVariant & rhs_variant = static_cast(rhs); + + size_t size = variants.size(); + if (size != rhs_variant.variants.size()) + return false; + + for (size_t i = 0; i < size; ++i) + if (!variants[i]->equals(*rhs_variant.variants[i])) + return false; + + return true; +} + +bool DataTypeVariant::textCanContainOnlyValidUTF8() const +{ + return std::all_of(variants.begin(), variants.end(), [](auto && elem) { return elem->textCanContainOnlyValidUTF8(); }); +} + +bool DataTypeVariant::haveMaximumSizeOfValue() const +{ + return std::all_of(variants.begin(), variants.end(), [](auto && elem) { return elem->haveMaximumSizeOfValue(); }); +} + +bool DataTypeVariant::hasDynamicSubcolumns() const +{ + return std::any_of(variants.begin(), variants.end(), [](auto && elem) { return elem->hasDynamicSubcolumns(); }); +} + +std::optional DataTypeVariant::tryGetVariantDiscriminator(const DataTypePtr & type) const +{ + String type_name = type->getName(); + for (size_t i = 0; i != variants.size(); ++i) + { + /// We don't use equals here, because it doesn't respect custom type names. 
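Editor's note on the hunk above: the DataTypeVariant constructor normalizes its input (duplicates are squashed, Nothing is dropped, the remaining variants are ordered by full type name), and the position of a variant in that sorted list is its global discriminator. tryGetVariantDiscriminator deliberately compares full type names rather than using equals(), so types that differ only by a custom name (for example Bool, which is implemented on top of UInt8) are still told apart. A minimal sketch of the resulting behaviour, not part of the patch, using only the interfaces added here plus DataTypeFactory:

    #include <DataTypes/DataTypeVariant.h>
    #include <DataTypes/DataTypeFactory.h>

    void variantDiscriminatorSketch()
    {
        using namespace DB;
        auto & factory = DataTypeFactory::instance();

        /// Duplicates are squashed and variants are sorted by their full type names.
        DataTypeVariant variant({factory.get("UInt64"), factory.get("String"), factory.get("UInt64")});
        /// variant.getName() == "Variant(String, UInt64)"

        /// Global discriminators follow the sorted order; lookup is by full type name.
        auto string_discr = variant.tryGetVariantDiscriminator(factory.get("String")); /// 0
        auto uint64_discr = variant.tryGetVariantDiscriminator(factory.get("UInt64")); /// 1
        auto missing      = variant.tryGetVariantDiscriminator(factory.get("IPv4"));   /// std::nullopt
    }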
+ if (variants[i]->getName() == type_name) + return i; + } + + return std::nullopt; +} + +size_t DataTypeVariant::getMaximumSizeOfValueInMemory() const +{ + size_t max_size = 0; + for (const auto & elem : variants) + { + size_t elem_max_size = elem->getMaximumSizeOfValueInMemory(); + if (elem_max_size > max_size) + max_size = elem_max_size; + } + return max_size; +} + +SerializationPtr DataTypeVariant::doGetDefaultSerialization() const +{ + SerializationVariant::VariantSerializations serializations; + serializations.reserve(variants.size()); + Names variant_names; + variant_names.reserve(variants.size()); + + for (const auto & variant : variants) + { + serializations.push_back(variant->getDefaultSerialization()); + variant_names.push_back(variant->getName()); + } + + return std::make_shared(std::move(serializations), std::move(variant_names), SerializationVariant::getVariantsDeserializeTextOrder(variants), getName()); +} + +static DataTypePtr create(const ASTPtr & arguments) +{ + if (!arguments || arguments->children.empty()) + throw Exception(ErrorCodes::EMPTY_DATA_PASSED, "Variant cannot be empty"); + + DataTypes nested_types; + nested_types.reserve(arguments->children.size()); + + for (const ASTPtr & child : arguments->children) + nested_types.emplace_back(DataTypeFactory::instance().get(child)); + + return std::make_shared(nested_types); +} + + +void registerDataTypeVariant(DataTypeFactory & factory) +{ + factory.registerDataType("Variant", create); +} + +} diff --git a/src/DataTypes/DataTypeVariant.h b/src/DataTypes/DataTypeVariant.h new file mode 100644 index 00000000000..60113a188b0 --- /dev/null +++ b/src/DataTypes/DataTypeVariant.h @@ -0,0 +1,64 @@ +#pragma once + +#include +#include +#include + + +namespace DB +{ + +/** Variant data type. + * This type represents a union of other data types. + * For example, type Variant(T1, T2, ..., TN) means that each row of this type + * has a value of either type T1 or T2 or ... or TN or none of them (NULL value). + * Nullable(...), LowCardinality(Nullable(...)) and Variant(...) types are not allowed + * inside Variant type. + * The order of nested types doesn't matter: Variant(T1, T2) = Variant(T2, T1). + * To have global order of nested types we sort variants by type names on Variant creation. + * The index of a variant in a sorted list is called global variant discriminator. 
+ */ +class DataTypeVariant final : public IDataType +{ +private: + DataTypes variants; + +public: + static constexpr bool is_parametric = true; + + explicit DataTypeVariant(const DataTypes & variants_); + + TypeIndex getTypeId() const override { return TypeIndex::Variant; } + const char * getFamilyName() const override { return "Variant"; } + + bool canBeInsideNullable() const override { return false; } + bool supportsSparseSerialization() const override { return false; } + bool canBeInsideSparseColumns() const override { return false; } + + MutableColumnPtr createColumn() const override; + + Field getDefault() const override; + + bool equals(const IDataType & rhs) const override; + + bool isParametric() const override { return true; } + bool haveSubtypes() const override { return true; } + bool textCanContainOnlyValidUTF8() const override; + bool haveMaximumSizeOfValue() const override; + bool hasDynamicSubcolumns() const override; + size_t getMaximumSizeOfValueInMemory() const override; + + const DataTypePtr & getVariant(size_t i) const { return variants[i]; } + const DataTypes & getVariants() const { return variants; } + + /// Check if Variant has provided type in the list of variants and return its discriminator. + std::optional tryGetVariantDiscriminator(const DataTypePtr & type) const; + +private: + std::string doGetName() const override; + std::string doGetPrettyName(size_t indent) const override; + SerializationPtr doGetDefaultSerialization() const override; +}; + +} + diff --git a/src/DataTypes/EnumValues.cpp b/src/DataTypes/EnumValues.cpp index 9df49e765a7..8a4b1304d5e 100644 --- a/src/DataTypes/EnumValues.cpp +++ b/src/DataTypes/EnumValues.cpp @@ -74,6 +74,27 @@ T EnumValues::getValue(StringRef field_name, bool try_treat_as_id) const return it->getMapped(); } +template +bool EnumValues::tryGetValue(T & x, StringRef field_name, bool try_treat_as_id) const +{ + const auto it = name_to_value_map.find(field_name); + if (!it) + { + /// It is used in CSV and TSV input formats. If we fail to find given string in + /// enum names, we will try to treat it as enum id. 
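Editor's note on EnumValues::tryGetValue above: it mirrors getValue but reports failure instead of throwing, and with try_treat_as_id it falls back to parsing the string as a numeric enum id (used by the CSV and TSV input formats), succeeding only if that id is actually registered. A minimal usage sketch, not part of the patch, assuming EnumValues is constructed from (name, value) pairs as in DataTypeEnum:

    #include <DataTypes/EnumValues.h>

    void enumTryGetValueSketch()
    {
        using namespace DB;
        EnumValues<Int8> values({{"hello", 1}, {"world", 2}});

        Int8 x;
        bool a = values.tryGetValue(x, "world");                         /// true,  x == 2
        bool b = values.tryGetValue(x, "unknown");                       /// false, nothing thrown
        bool c = values.tryGetValue(x, "1", /*try_treat_as_id=*/ true);  /// true,  "1" parsed as the id of "hello"
        bool d = values.tryGetValue(x, "42", /*try_treat_as_id=*/ true); /// false, 42 is not a registered value
    }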
+ if (try_treat_as_id) + { + ReadBufferFromMemory tmp_buf(field_name.data, field_name.size); + if (!tryReadText(x, tmp_buf) || !tmp_buf.eof() || !value_to_name_map.contains(x)) + return false; + return true; + } + return false; + } + x = it->getMapped(); + return true; +} + template Names EnumValues::getAllRegisteredNames() const { diff --git a/src/DataTypes/EnumValues.h b/src/DataTypes/EnumValues.h index 5189f7a56f5..889878bc60f 100644 --- a/src/DataTypes/EnumValues.h +++ b/src/DataTypes/EnumValues.h @@ -7,7 +7,7 @@ namespace DB { -namespace ErrorCodes +namespace ErrorCodesEnumValues { extern const int BAD_ARGUMENTS; } @@ -42,6 +42,11 @@ public: return it; } + bool hasValue(const T & value) const + { + return value_to_name_map.contains(value); + } + /// throws exception if value is not valid const StringRef & getNameForValue(const T & value) const { @@ -60,6 +65,7 @@ public: } T getValue(StringRef field_name, bool try_treat_as_id = false) const; + bool tryGetValue(T & x, StringRef field_name, bool try_treat_as_id = false) const; template bool containsAll(const TValues & rhs_values) const diff --git a/src/DataTypes/IDataType.cpp b/src/DataTypes/IDataType.cpp index 2a7e0f246de..392c56343e3 100644 --- a/src/DataTypes/IDataType.cpp +++ b/src/DataTypes/IDataType.cpp @@ -109,11 +109,26 @@ Ptr IDataType::getForSubcolumn( bool throw_if_null) const { Ptr res; - forEachSubcolumn([&](const auto &, const auto & name, const auto & subdata) + + ISerialization::StreamCallback callback_with_data = [&](const auto & subpath) { - if (name == subcolumn_name) - res = subdata.*member; - }, data); + for (size_t i = 0; i < subpath.size(); ++i) + { + size_t prefix_len = i + 1; + if (!subpath[i].visited && ISerialization::hasSubcolumnForPath(subpath, prefix_len)) + { + auto name = ISerialization::getSubcolumnNameForStream(subpath, prefix_len); + /// Create data from path only if it's requested subcolumn. 
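Editor's note on the IDataType::getForSubcolumn rework above: instead of going through forEachSubcolumn, it now enumerates the serialization's substream paths directly and materializes SubstreamData (via createFromPath) only for the path whose subcolumn name matches the request. From the outside this is what backs the public subcolumn accessors; a minimal sketch, not part of the patch:

    #include <DataTypes/DataTypeFactory.h>

    void subcolumnLookupSketch()
    {
        using namespace DB;
        auto type = DataTypeFactory::instance().get("Nullable(UInt64)");

        /// Both calls are resolved through getForSubcolumn.
        auto null_map_type = type->getSubcolumnType("null");     /// the UInt8 null mask subcolumn
        auto missing       = type->tryGetSubcolumnType("nope");  /// nullptr, no exception
    }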
+ if (name == subcolumn_name) + res = ISerialization::createFromPath(subpath, prefix_len).*member; + } + subpath[i].visited = true; + } + }; + + ISerialization::EnumerateStreamsSettings settings; + settings.position_independent_encoding = false; + data.serialization->enumerateStreams(settings, callback_with_data, data); if (!res && throw_if_null) throw Exception(ErrorCodes::ILLEGAL_COLUMN, "There is no subcolumn {} in type {}", subcolumn_name, getName()); diff --git a/src/DataTypes/IDataType.h b/src/DataTypes/IDataType.h index eabf066bc3d..ccdf54f57c3 100644 --- a/src/DataTypes/IDataType.h +++ b/src/DataTypes/IDataType.h @@ -412,6 +412,8 @@ struct WhichDataType constexpr bool isSimple() const { return isInt() || isUInt() || isFloat() || isString(); } constexpr bool isLowCardinality() const { return idx == TypeIndex::LowCardinality; } + + constexpr bool isVariant() const { return idx == TypeIndex::Variant; } }; /// IDataType helpers (alternative for IDataType virtual methods with single point of truth) @@ -464,6 +466,7 @@ template inline bool isTuple(const T & data_type) { return WhichDat template inline bool isMap(const T & data_type) {return WhichDataType(data_type).isMap(); } template inline bool isInterval(const T & data_type) {return WhichDataType(data_type).isInterval(); } template inline bool isObject(const T & data_type) { return WhichDataType(data_type).isObject(); } +template inline bool isVariant(const T & data_type) { return WhichDataType(data_type).isVariant(); } template inline bool isNothing(const T & data_type) { return WhichDataType(data_type).isNothing(); } diff --git a/src/DataTypes/Serializations/ISerialization.cpp b/src/DataTypes/Serializations/ISerialization.cpp index e70dc6a2380..86a37949dc8 100644 --- a/src/DataTypes/Serializations/ISerialization.cpp +++ b/src/DataTypes/Serializations/ISerialization.cpp @@ -55,6 +55,9 @@ String ISerialization::Substream::toString() const return fmt::format("TupleElement({}, escape_tuple_delimiter = {})", tuple_element_name, escape_tuple_delimiter ? "true" : "false"); + if (type == VariantElement) + return fmt::format("VariantElement({})", variant_element_name); + return String(magic_enum::enum_name(type)); } @@ -172,6 +175,10 @@ String getNameForSubstreamPath( else stream_name += "." + it->tuple_element_name; } + else if (it->type == Substream::VariantDiscriminators) + stream_name += ".discr"; + else if (it->type == Substream::VariantElement) + stream_name += "." + it->variant_element_name; } return stream_name; @@ -252,6 +259,45 @@ bool ISerialization::isSpecialCompressionAllowed(const SubstreamPath & path) return true; } +#define TRY_DESERIALIZE_TEXT(deserialize) \ + size_t prev_size = column.size(); \ + try \ + { \ + deserialize(column, istr, settings); \ + return true; \ + } \ + catch (...) 
\ + { \ + if (column.size() > prev_size) \ + column.popBack(column.size() - prev_size); \ + return false; \ + } \ + +bool ISerialization::tryDeserializeTextCSV(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const +{ + TRY_DESERIALIZE_TEXT(deserializeTextCSV) +} + +bool ISerialization::tryDeserializeTextEscaped(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const +{ + TRY_DESERIALIZE_TEXT(deserializeTextEscaped) +} + +bool ISerialization::tryDeserializeTextJSON(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const +{ + TRY_DESERIALIZE_TEXT(deserializeTextJSON) +} + +bool ISerialization::tryDeserializeTextQuoted(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const +{ + TRY_DESERIALIZE_TEXT(deserializeTextQuoted) +} + +bool ISerialization::tryDeserializeWholeText(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const +{ + TRY_DESERIALIZE_TEXT(deserializeWholeText) +} + void ISerialization::deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { String field; @@ -261,6 +307,15 @@ void ISerialization::deserializeTextRaw(IColumn & column, ReadBuffer & istr, con deserializeWholeText(column, buf, settings); } +bool ISerialization::tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + /// Read until \t or \n. + readString(field, istr); + ReadBufferFromString buf(field); + return tryDeserializeWholeText(column, buf, settings); +} + void ISerialization::serializeTextMarkdown( const DB::IColumn & column, size_t row_num, DB::WriteBuffer & ostr, const DB::FormatSettings & settings) const { @@ -288,7 +343,9 @@ bool ISerialization::hasSubcolumnForPath(const SubstreamPath & path, size_t pref size_t last_elem = prefix_len - 1; return path[last_elem].type == Substream::NullMap || path[last_elem].type == Substream::TupleElement - || path[last_elem].type == Substream::ArraySizes; + || path[last_elem].type == Substream::ArraySizes + || path[last_elem].type == Substream::VariantDiscriminators + || path[last_elem].type == Substream::VariantElement; } ISerialization::SubstreamData ISerialization::createFromPath(const SubstreamPath & path, size_t prefix_len) @@ -317,6 +374,8 @@ void ISerialization::throwUnexpectedDataAfterParsedValue(IColumn & column, ReadB { WriteBufferFromOwnString ostr; serializeText(column, column.size() - 1, ostr, settings); + /// Restore correct column size. + column.popBack(1); throw Exception( ErrorCodes::UNEXPECTED_DATA_AFTER_PARSED_VALUE, "Unexpected data '{}' after parsed {} value '{}'", diff --git a/src/DataTypes/Serializations/ISerialization.h b/src/DataTypes/Serializations/ISerialization.h index 030c3c6d81e..f0273f59d1f 100644 --- a/src/DataTypes/Serializations/ISerialization.h +++ b/src/DataTypes/Serializations/ISerialization.h @@ -152,6 +152,10 @@ public: ObjectStructure, ObjectData, + VariantDiscriminators, + VariantElements, + VariantElement, + Regular, }; @@ -160,6 +164,9 @@ public: /// Index of tuple element, starting at 1 or name. String tuple_element_name; + /// The name of a variant element type. + String variant_element_name; + /// Do we need to escape a dot in filenames for tuple elements. 
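Editor's note on the TRY_DESERIALIZE_TEXT wrappers above: they give every serialization a default non-throwing variant of its text parsers by running the throwing parser and, on failure, rolling the column back to its previous size and returning false. That lets callers probe several candidate types against the same text without exception overhead, which is the kind of loop the Variant text parsing can build on (SerializationVariant::getVariantsDeserializeTextOrder earlier in this patch establishes such an order). A minimal caller-side sketch, not part of the patch; serializations, columns, field and format_settings are placeholders here:

    /// Try candidate serializations in some preferred order until one accepts the text.
    /// `serializations`, `columns`, `field`, `format_settings` are hypothetical
    /// (e.g. Serializations, MutableColumns, String, FormatSettings).
    bool parsed = false;
    for (size_t i = 0; i < serializations.size() && !parsed; ++i)
    {
        DB::ReadBufferFromString buf(field);  /// re-read the same text for each candidate
        parsed = serializations[i]->tryDeserializeWholeText(*columns[i], buf, format_settings);
    }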
bool escape_tuple_delimiter = true; @@ -320,17 +327,20 @@ public: virtual void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const = 0; virtual void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const = 0; + virtual bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const; /** Text serialization as a literal that may be inserted into a query. */ virtual void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const = 0; virtual void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const = 0; + virtual bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const; /** Text serialization for the CSV format. */ virtual void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const = 0; virtual void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const = 0; + virtual bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const; /** Text serialization for displaying on a terminal or saving into a text file, and the like. * Without escaping or quoting. @@ -340,11 +350,13 @@ public: /** Text deserialization in case when buffer contains only one value, without any escaping and delimiters. */ virtual void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const = 0; + virtual bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const; /** Text serialization intended for using in JSON format. */ virtual void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const = 0; virtual void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const = 0; + virtual bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const; virtual void serializeTextJSONPretty(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings, size_t /*indent*/) const { serializeTextJSON(column, row_num, ostr, settings); @@ -364,6 +376,7 @@ public: * additional code in data types serialization and ReadHelpers. 
*/ virtual void deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const; + virtual bool tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const; virtual void serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const; virtual void serializeTextMarkdown(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const; diff --git a/src/DataTypes/Serializations/SerializationArray.cpp b/src/DataTypes/Serializations/SerializationArray.cpp index c804f58c567..be23278ef25 100644 --- a/src/DataTypes/Serializations/SerializationArray.cpp +++ b/src/DataTypes/Serializations/SerializationArray.cpp @@ -417,9 +417,11 @@ static void serializeTextImpl(const IColumn & column, size_t row_num, WriteBuffe } -template -static void deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && read_nested, bool allow_unenclosed) +template +static ReturnType deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && read_nested, bool allow_unenclosed) { + static constexpr bool throw_exception = std::is_same_v; + ColumnArray & column_array = assert_cast(column); ColumnArray::Offsets & offsets = column_array.getOffsets(); @@ -431,7 +433,18 @@ static void deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && r if (checkChar('[', istr)) has_braces = true; else if (!allow_unenclosed) - throw Exception(ErrorCodes::CANNOT_READ_ARRAY_FROM_TEXT, "Array does not start with '[' character"); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::CANNOT_READ_ARRAY_FROM_TEXT, "Array does not start with '[' character"); + return ReturnType(false); + } + + auto on_error_no_throw = [&]() + { + if (size) + nested_column.popBack(size); + return ReturnType(false); + }; try { @@ -441,11 +454,17 @@ static void deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && r if (!first) { if (*istr.position() == ',') + { ++istr.position(); + } else - throw ParsingException(ErrorCodes::CANNOT_READ_ARRAY_FROM_TEXT, - "Cannot read array from text, expected comma or end of array, found '{}'", - *istr.position()); + { + if constexpr (throw_exception) + throw ParsingException(ErrorCodes::CANNOT_READ_ARRAY_FROM_TEXT, + "Cannot read array from text, expected comma or end of array, found '{}'", + *istr.position()); + return on_error_no_throw(); + } } first = false; @@ -455,25 +474,42 @@ static void deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && r if (*istr.position() == ']') break; - read_nested(nested_column); + if constexpr (throw_exception) + read_nested(nested_column); + else if (!read_nested(nested_column)) + return on_error_no_throw(); + ++size; skipWhitespaceIfAny(istr); } if (has_braces) - assertChar(']', istr); + { + if constexpr (throw_exception) + assertChar(']', istr); + else if (!checkChar(']', istr)) + return on_error_no_throw(); + } else /// If array is not enclosed in braces, we read until EOF. - assertEOF(istr); + { + if constexpr (throw_exception) + assertEOF(istr); + else if (!istr.eof()) + return on_error_no_throw(); + } } catch (...) 
{ if (size) nested_column.popBack(size); - throw; + if constexpr (throw_exception) + throw; + return ReturnType(false); } offsets.push_back(offsets.back() + size); + return ReturnType(true); } @@ -492,8 +528,8 @@ void SerializationArray::deserializeText(IColumn & column, ReadBuffer & istr, co deserializeTextImpl(column, istr, [&](IColumn & nested_column) { - if (settings.null_as_default) - SerializationNullable::deserializeTextQuotedImpl(nested_column, istr, settings, nested); + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(nested_column)) + SerializationNullable::deserializeNullAsDefaultOrNestedTextQuoted(nested_column, istr, settings, nested); else nested->deserializeTextQuoted(nested_column, istr, settings); }, false); @@ -502,6 +538,29 @@ void SerializationArray::deserializeText(IColumn & column, ReadBuffer & istr, co throwUnexpectedDataAfterParsedValue(column, istr, settings, "Array"); } +bool SerializationArray::tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const +{ + auto read_nested = [&](IColumn & nested_column) + { + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(nested_column)) + return SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextQuoted(nested_column, istr, settings, nested); + return nested->tryDeserializeTextQuoted(nested_column, istr, settings); + }; + + bool ok = deserializeTextImpl(column, istr, std::move(read_nested), false); + + if (!ok) + return false; + + if (whole && !istr.eof()) + { + column.popBack(1); + return false; + } + + return true; +} + void SerializationArray::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { const ColumnArray & column_array = assert_cast(column); @@ -557,13 +616,25 @@ void SerializationArray::deserializeTextJSON(IColumn & column, ReadBuffer & istr deserializeTextImpl(column, istr, [&](IColumn & nested_column) { - if (settings.null_as_default) - SerializationNullable::deserializeTextJSONImpl(nested_column, istr, settings, nested); + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(nested_column)) + SerializationNullable::deserializeNullAsDefaultOrNestedTextJSON(nested_column, istr, settings, nested); else nested->deserializeTextJSON(nested_column, istr, settings); }, false); } +bool SerializationArray::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + auto read_nested = [&](IColumn & nested_column) + { + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(nested_column)) + return SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextJSON(nested_column, istr, settings, nested); + return nested->tryDeserializeTextJSON(nested_column, istr, settings); + }; + + return deserializeTextImpl(column, istr, std::move(read_nested), false); +} + void SerializationArray::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { @@ -606,8 +677,8 @@ void SerializationArray::deserializeTextCSV(IColumn & column, ReadBuffer & istr, deserializeTextImpl(column, rb, [&](IColumn & nested_column) { - if (settings.null_as_default) - SerializationNullable::deserializeTextCSVImpl(nested_column, rb, settings, nested); + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(nested_column)) + SerializationNullable::deserializeNullAsDefaultOrNestedTextCSV(nested_column, rb, settings, nested); 
else nested->deserializeTextCSV(nested_column, rb, settings); }, true); @@ -617,12 +688,43 @@ void SerializationArray::deserializeTextCSV(IColumn & column, ReadBuffer & istr, deserializeTextImpl(column, rb, [&](IColumn & nested_column) { - if (settings.null_as_default) - SerializationNullable::deserializeTextQuotedImpl(nested_column, rb, settings, nested); + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(nested_column)) + SerializationNullable::deserializeNullAsDefaultOrNestedTextQuoted(nested_column, rb, settings, nested); else nested->deserializeTextQuoted(nested_column, rb, settings); }, true); } } +bool SerializationArray::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String s; + if (!tryReadCSV(s, istr, settings.csv)) + return false; + ReadBufferFromString rb(s); + + if (settings.csv.arrays_as_nested_csv) + { + auto read_nested = [&](IColumn & nested_column) + { + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(nested_column)) + return SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextCSV(nested_column, rb, settings, nested); + return nested->tryDeserializeTextCSV(nested_column, rb, settings); + }; + + return deserializeTextImpl(column, rb, read_nested, true); + } + else + { + auto read_nested = [&](IColumn & nested_column) + { + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(nested_column)) + return SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextQuoted(nested_column, rb, settings, nested); + return nested->tryDeserializeTextQuoted(nested_column, rb, settings); + }; + + return deserializeTextImpl(column, rb, read_nested, true); + } +} + } diff --git a/src/DataTypes/Serializations/SerializationArray.h b/src/DataTypes/Serializations/SerializationArray.h index de331169db5..82f5e8bce45 100644 --- a/src/DataTypes/Serializations/SerializationArray.h +++ b/src/DataTypes/Serializations/SerializationArray.h @@ -20,15 +20,18 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const override; + bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSONPretty(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings, size_t indent) const override; void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; /** Streaming serialization of arrays is arranged in a special way: * - elements placed in a row are written/read without array sizes; diff --git a/src/DataTypes/Serializations/SerializationBool.cpp 
b/src/DataTypes/Serializations/SerializationBool.cpp index 41b5bf806e5..f745fac4d30 100644 --- a/src/DataTypes/Serializations/SerializationBool.cpp +++ b/src/DataTypes/Serializations/SerializationBool.cpp @@ -150,30 +150,42 @@ bool tryDeserializeAllVariants(ColumnUInt8 * column, ReadBuffer & istr) return true; } -void deserializeImpl( +template +ReturnType deserializeImpl( IColumn & column, ReadBuffer & istr, const FormatSettings & settings, std::function check_end_of_value) { + static constexpr bool throw_exception = std::is_same_v; + ColumnUInt8 * col = checkAndGetDeserializeColumnType(column); + auto restore_column_if_needed = [&, prev_size = col->size()]() + { + if (col->size() > prev_size) + col->popBack(1); + }; PeekableReadBuffer buf(istr); buf.setCheckpoint(); if (checkString(settings.bool_true_representation, buf) && check_end_of_value(buf)) { col->insert(true); - return; + return ReturnType(true); } buf.rollbackToCheckpoint(); if (checkString(settings.bool_false_representation, buf) && check_end_of_value(buf)) { - col->insert(false); buf.dropCheckpoint(); if (buf.hasUnreadData()) - throw Exception( - ErrorCodes::CANNOT_PARSE_BOOL, - "Cannot continue parsing after parsed bool value because it will result in the loss of some data. It may happen if " - "bool_true_representation or bool_false_representation contains some delimiters of input format"); - return; + { + if constexpr (throw_exception) + throw Exception( + ErrorCodes::CANNOT_PARSE_BOOL, + "Cannot continue parsing after parsed bool value because it will result in the loss of some data. It may happen if " + "bool_true_representation or bool_false_representation contains some delimiters of input format"); + return ReturnType(false); + } + col->insert(false); + return ReturnType(true); } buf.rollbackToCheckpoint(); @@ -181,22 +193,31 @@ void deserializeImpl( { buf.dropCheckpoint(); if (buf.hasUnreadData()) - throw Exception( - ErrorCodes::CANNOT_PARSE_BOOL, - "Cannot continue parsing after parsed bool value because it will result in the loss of some data. It may happen if " - "bool_true_representation or bool_false_representation contains some delimiters of input format"); - return; + { + if constexpr (throw_exception) + throw Exception( + ErrorCodes::CANNOT_PARSE_BOOL, + "Cannot continue parsing after parsed bool value because it will result in the loss of some data. 
It may happen if " + "bool_true_representation or bool_false_representation contains some delimiters of input format"); + restore_column_if_needed(); + return ReturnType(false); + } + return ReturnType(true); } buf.makeContinuousMemoryFromCheckpointToPos(); buf.rollbackToCheckpoint(); - throw Exception( - ErrorCodes::CANNOT_PARSE_BOOL, - "Cannot parse boolean value here: '{}', should be '{}' or '{}' controlled by setting bool_true_representation and " - "bool_false_representation or one of " - "True/False/T/F/Y/N/Yes/No/On/Off/Enable/Disable/Enabled/Disabled/1/0", - String(buf.position(), std::min(10lu, buf.available())), - settings.bool_true_representation, settings.bool_false_representation); + restore_column_if_needed(); + if constexpr (throw_exception) + throw Exception( + ErrorCodes::CANNOT_PARSE_BOOL, + "Cannot parse boolean value here: '{}', should be '{}' or '{}' controlled by setting bool_true_representation and " + "bool_false_representation or one of " + "True/False/T/F/Y/N/Yes/No/On/Off/Enable/Disable/Enabled/Disabled/1/0", + String(buf.position(), std::min(10lu, buf.available())), + settings.bool_true_representation, settings.bool_false_representation); + + return ReturnType(false); } } @@ -225,6 +246,14 @@ void SerializationBool::deserializeTextEscaped(IColumn & column, ReadBuffer & is deserializeImpl(column, istr, settings, [](ReadBuffer & buf){ return buf.eof() || *buf.position() == '\t' || *buf.position() == '\n'; }); } +bool SerializationBool::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + if (istr.eof()) + return false; + + return deserializeImpl(column, istr, settings, [](ReadBuffer & buf){ return buf.eof() || *buf.position() == '\t' || *buf.position() == '\n'; }); +} + void SerializationBool::serializeTextJSON(const IColumn &column, size_t row_num, WriteBuffer &ostr, const FormatSettings &settings) const { serializeSimple(column, row_num, ostr, settings); @@ -250,6 +279,33 @@ void SerializationBool::deserializeTextJSON(IColumn &column, ReadBuffer &istr, c col->insert(value); } +bool SerializationBool::tryDeserializeTextJSON(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings &) const +{ + if (istr.eof()) + return false; + + ColumnUInt8 * col = checkAndGetDeserializeColumnType(column); + bool value = false; + char first_char = *istr.position(); + if (first_char == 't' || first_char == 'f') + { + if (!readBoolTextWord(value, istr)) + return false; + } + else if (first_char == '1' || first_char == '0') + { + /// Doesn't throw. 
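Editor's note on the templated deserializeImpl above: the bool parsers now work in both modes, with the throwing overloads keeping their error messages while the try variants restore the column and return false for any input that is not one of the accepted spellings (the configured bool_true_representation / bool_false_representation, true/false, 1/0, or the T/F/Y/N/Yes/No/On/Off/Enable(d)/Disable(d) words). A minimal sketch, not part of the patch:

    #include <DataTypes/DataTypeFactory.h>
    #include <IO/ReadBufferFromString.h>
    #include <Formats/FormatSettings.h>

    void boolTryParseSketch()
    {
        using namespace DB;
        auto bool_type = DataTypeFactory::instance().get("Bool");
        auto column = bool_type->createColumn();
        auto serialization = bool_type->getDefaultSerialization();
        FormatSettings settings;

        ReadBufferFromString ok("yes");
        bool parsed = serialization->tryDeserializeWholeText(*column, ok, settings);   /// true, inserts 1

        ReadBufferFromString bad("maybe");
        bool failed = !serialization->tryDeserializeWholeText(*column, bad, settings); /// true, column left unchanged
    }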
+ readBoolText(value, istr); + } + else + { + return false; + } + + col->insert(value); + return true; +} + void SerializationBool::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { serializeCustom(column, row_num, ostr, settings); @@ -263,6 +319,14 @@ void SerializationBool::deserializeTextCSV(IColumn & column, ReadBuffer & istr, deserializeImpl(column, istr, settings, [&](ReadBuffer & buf){ return buf.eof() || *buf.position() == settings.csv.delimiter || *buf.position() == '\n' || *buf.position() == '\r'; }); } +bool SerializationBool::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + if (istr.eof()) + return false; + + return deserializeImpl(column, istr, settings, [&](ReadBuffer & buf){ return buf.eof() || *buf.position() == settings.csv.delimiter || *buf.position() == '\n' || *buf.position() == '\r'; }); +} + void SerializationBool::serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { serializeCustom(column, row_num, ostr, settings); @@ -276,15 +340,30 @@ void SerializationBool::deserializeTextRaw(IColumn & column, ReadBuffer & istr, deserializeImpl(column, istr, settings, [&](ReadBuffer & buf){ return buf.eof() || *buf.position() == '\t' || *buf.position() == '\n'; }); } +bool SerializationBool::tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + if (istr.eof()) + return false; + + return deserializeImpl(column, istr, settings, [&](ReadBuffer & buf){ return buf.eof() || *buf.position() == '\t' || *buf.position() == '\n'; }); +} + void SerializationBool::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { serializeSimple(column, row_num, ostr, settings); } -void SerializationBool::deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +template +ReturnType deserializeTextQuotedImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) { + static constexpr bool throw_exception = std::is_same_v; + if (istr.eof()) - throw Exception(ErrorCodes::CANNOT_PARSE_BOOL, "Expected boolean value but get EOF."); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::CANNOT_PARSE_BOOL, "Expected boolean value but get EOF."); + return ReturnType(false); + } auto * col = checkAndGetDeserializeColumnType(column); @@ -292,11 +371,17 @@ void SerializationBool::deserializeTextQuoted(IColumn & column, ReadBuffer & ist switch (symbol) { case 't': - assertStringCaseInsensitive("true", istr); + if constexpr (throw_exception) + assertStringCaseInsensitive("true", istr); + else if (!checkStringCaseInsensitive("true", istr)) + return ReturnType(false); col->insert(true); break; case 'f': - assertStringCaseInsensitive("false", istr); + if constexpr (throw_exception) + assertStringCaseInsensitive("false", istr); + else if (!checkStringCaseInsensitive("false", istr)) + return ReturnType(false); col->insert(false); break; case '1': @@ -307,16 +392,40 @@ void SerializationBool::deserializeTextQuoted(IColumn & column, ReadBuffer & ist break; case '\'': ++istr.position(); - deserializeImpl(column, istr, settings, [](ReadBuffer & buf){ return !buf.eof() && *buf.position() == '\''; }); - assertChar('\'', istr); + if constexpr (throw_exception) + { + deserializeImpl(column, istr, settings, [](ReadBuffer & buf){ return !buf.eof() && *buf.position() == 
'\''; }); + assertChar('\'', istr); + } + else + { + if (!deserializeImpl(column, istr, settings, [](ReadBuffer & buf) { return !buf.eof() && *buf.position() == '\''; }) || !checkChar('\'', istr)) + return ReturnType(false); + } break; default: - throw Exception( - ErrorCodes::CANNOT_PARSE_BOOL, - "Cannot parse boolean value here: '{}', should be true/false, 1/0 or on of " - "True/False/T/F/Y/N/Yes/No/On/Off/Enable/Disable/Enabled/Disabled/1/0 in quotes", - String(istr.position(), std::min(10ul, istr.available()))); + { + if constexpr (throw_exception) + throw Exception( + ErrorCodes::CANNOT_PARSE_BOOL, + "Cannot parse boolean value here: '{}', should be true/false, 1/0 or on of " + "True/False/T/F/Y/N/Yes/No/On/Off/Enable/Disable/Enabled/Disabled/1/0 in quotes", + String(istr.position(), std::min(10ul, istr.available()))); + return ReturnType(false); + } } + + return ReturnType(true); +} + +void SerializationBool::deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + deserializeTextQuotedImpl(column, istr, settings); +} + +bool SerializationBool::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return deserializeTextQuotedImpl(column, istr, settings); } void SerializationBool::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const @@ -327,6 +436,14 @@ void SerializationBool::deserializeWholeText(IColumn & column, ReadBuffer & istr deserializeImpl(column, istr, settings, [&](ReadBuffer & buf){ return buf.eof(); }); } +bool SerializationBool::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + if (istr.eof()) + return false; + + return deserializeImpl(column, istr, settings, [&](ReadBuffer & buf){ return buf.eof(); }); +} + void SerializationBool::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { serializeSimple(column, row_num, ostr, settings); diff --git a/src/DataTypes/Serializations/SerializationBool.h b/src/DataTypes/Serializations/SerializationBool.h index a5aa0ca80a2..3e511b7249e 100644 --- a/src/DataTypes/Serializations/SerializationBool.h +++ b/src/DataTypes/Serializations/SerializationBool.h @@ -15,21 +15,27 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; - void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextCSV(IColumn & 
column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; void deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; }; diff --git a/src/DataTypes/Serializations/SerializationCustomSimpleText.cpp b/src/DataTypes/Serializations/SerializationCustomSimpleText.cpp index 03564bac64b..abe443cab1b 100644 --- a/src/DataTypes/Serializations/SerializationCustomSimpleText.cpp +++ b/src/DataTypes/Serializations/SerializationCustomSimpleText.cpp @@ -24,6 +24,12 @@ void deserializeFromString(const SerializationCustomSimpleText & domain, IColumn domain.deserializeText(column, istr, settings, true); } +bool tryDeserializeFromString(const SerializationCustomSimpleText & domain, IColumn & column, const String & s, const FormatSettings & settings) +{ + ReadBufferFromString istr(s); + return domain.tryDeserializeText(column, istr, settings, true); +} + } namespace DB @@ -34,6 +40,19 @@ SerializationCustomSimpleText::SerializationCustomSimpleText(const Serialization { } +bool SerializationCustomSimpleText::tryDeserializeText(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, bool whole) const +{ + try + { + deserializeText(column, istr, settings, whole); + return true; + } + catch (...) 
+ { + return false; + } +} + void SerializationCustomSimpleText::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { String str; @@ -41,6 +60,13 @@ void SerializationCustomSimpleText::deserializeWholeText(IColumn & column, ReadB deserializeFromString(*this, column, str, settings); } +bool SerializationCustomSimpleText::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String str; + readStringUntilEOF(str, istr); + return tryDeserializeFromString(*this, column, str, settings); +} + void SerializationCustomSimpleText::serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeEscapedString(serializeToString(*this, column, row_num, settings), ostr); @@ -53,6 +79,13 @@ void SerializationCustomSimpleText::deserializeTextEscaped(IColumn & column, Rea deserializeFromString(*this, column, str, settings); } +bool SerializationCustomSimpleText::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String str; + readEscapedString(str, istr); + return tryDeserializeFromString(*this, column, str, settings); +} + void SerializationCustomSimpleText::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeQuotedString(serializeToString(*this, column, row_num, settings), ostr); @@ -65,6 +98,14 @@ void SerializationCustomSimpleText::deserializeTextQuoted(IColumn & column, Read deserializeFromString(*this, column, str, settings); } +bool SerializationCustomSimpleText::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String str; + if (!tryReadQuotedString(str, istr)) + return false; + return tryDeserializeFromString(*this, column, str, settings); +} + void SerializationCustomSimpleText::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeCSVString(serializeToString(*this, column, row_num, settings), ostr); @@ -77,6 +118,13 @@ void SerializationCustomSimpleText::deserializeTextCSV(IColumn & column, ReadBuf deserializeFromString(*this, column, str, settings); } +bool SerializationCustomSimpleText::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String str; + readCSVStringInto(str, istr, settings.csv); + return tryDeserializeFromString(*this, column, str, settings); +} + void SerializationCustomSimpleText::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeJSONString(serializeToString(*this, column, row_num, settings), ostr, settings); @@ -89,6 +137,14 @@ void SerializationCustomSimpleText::deserializeTextJSON(IColumn & column, ReadBu deserializeFromString(*this, column, str, settings); } +bool SerializationCustomSimpleText::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String str; + if (!tryReadJSONStringInto(str, istr)) + return false; + return tryDeserializeFromString(*this, column, str, settings); +} + void SerializationCustomSimpleText::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeXMLStringForTextElement(serializeToString(*this, column, row_num, settings), ostr); diff --git a/src/DataTypes/Serializations/SerializationCustomSimpleText.h 
b/src/DataTypes/Serializations/SerializationCustomSimpleText.h index 0c909350002..c80a57e234c 100644 --- a/src/DataTypes/Serializations/SerializationCustomSimpleText.h +++ b/src/DataTypes/Serializations/SerializationCustomSimpleText.h @@ -22,20 +22,24 @@ public: /// whole = true means that buffer contains only one value, so we should read until EOF. /// It's needed to check if there is garbage after parsed field. virtual void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const = 0; + virtual bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const; /** Text deserialization in case when buffer contains only one value, without any escaping and delimiters. */ void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; /** Text serialization with escaping but without quoting. */ void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; /** Text serialization as a literal that may be inserted into a query. */ void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; /** Text serialization for the CSV format. */ @@ -44,12 +48,14 @@ public: * (the delimiter is not consumed). */ void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; /** Text serialization intended for using in JSON format. * force_quoting_64bit_integers parameter forces to brace UInt64 and Int64 types into quotes. */ void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; /** Text serialization for putting into the XML format. 
*/ diff --git a/src/DataTypes/Serializations/SerializationDate.cpp b/src/DataTypes/Serializations/SerializationDate.cpp index 534f599a072..38e1bb87b6d 100644 --- a/src/DataTypes/Serializations/SerializationDate.cpp +++ b/src/DataTypes/Serializations/SerializationDate.cpp @@ -22,6 +22,15 @@ void SerializationDate::deserializeWholeText(IColumn & column, ReadBuffer & istr throwUnexpectedDataAfterParsedValue(column, istr, settings, "Date"); } +bool SerializationDate::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + DayNum x; + if (!tryReadDateText(x, istr, time_zone) || !istr.eof()) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationDate::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { DayNum x; @@ -29,6 +38,15 @@ void SerializationDate::deserializeTextEscaped(IColumn & column, ReadBuffer & is assert_cast(column).getData().push_back(x); } +bool SerializationDate::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + DayNum x; + if (!tryReadDateText(x, istr, time_zone)) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationDate::serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { serializeText(column, row_num, ostr, settings); @@ -50,6 +68,16 @@ void SerializationDate::deserializeTextQuoted(IColumn & column, ReadBuffer & ist assert_cast(column).getData().push_back(x); /// It's important to do this at the end - for exception safety. } +bool SerializationDate::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + DayNum x; + if (!checkChar('\'', istr) || !tryReadDateText(x, istr, time_zone) || !checkChar('\'', istr)) + return false; + + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationDate::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -66,6 +94,15 @@ void SerializationDate::deserializeTextJSON(IColumn & column, ReadBuffer & istr, assert_cast(column).getData().push_back(x); } +bool SerializationDate::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + DayNum x; + if (!checkChar('"', istr) || !tryReadDateText(x, istr, time_zone) || !checkChar('"', istr)) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationDate::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -80,6 +117,15 @@ void SerializationDate::deserializeTextCSV(IColumn & column, ReadBuffer & istr, assert_cast(column).getData().push_back(value); } +bool SerializationDate::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + DayNum value; + if (!tryReadCSV(value, istr, time_zone)) + return false; + assert_cast(column).getData().push_back(value); + return true; +} + SerializationDate::SerializationDate(const DateLUTImpl & time_zone_) : time_zone(time_zone_) { } diff --git a/src/DataTypes/Serializations/SerializationDate.h b/src/DataTypes/Serializations/SerializationDate.h index f751b06fba6..dcf79eb49da 100644 --- a/src/DataTypes/Serializations/SerializationDate.h +++ b/src/DataTypes/Serializations/SerializationDate.h @@ -13,14 +13,19 @@ public: void 
serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; protected: const DateLUTImpl & time_zone; diff --git a/src/DataTypes/Serializations/SerializationDate32.cpp b/src/DataTypes/Serializations/SerializationDate32.cpp index 851710de839..70a22d59e42 100644 --- a/src/DataTypes/Serializations/SerializationDate32.cpp +++ b/src/DataTypes/Serializations/SerializationDate32.cpp @@ -21,6 +21,15 @@ void SerializationDate32::deserializeWholeText(IColumn & column, ReadBuffer & is throwUnexpectedDataAfterParsedValue(column, istr, settings, "Date32"); } +bool SerializationDate32::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + ExtendedDayNum x; + if (!tryReadDateText(x, istr, time_zone) || !istr.eof()) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationDate32::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { ExtendedDayNum x; @@ -28,6 +37,15 @@ void SerializationDate32::deserializeTextEscaped(IColumn & column, ReadBuffer & assert_cast(column).getData().push_back(x); } +bool SerializationDate32::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + ExtendedDayNum x; + if (!tryReadDateText(x, istr, time_zone)) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationDate32::serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { serializeText(column, row_num, ostr, settings); @@ -49,6 +67,15 @@ void SerializationDate32::deserializeTextQuoted(IColumn & column, ReadBuffer & i assert_cast(column).getData().push_back(x); /// It's important to do this at the end - for exception safety. 
} +bool SerializationDate32::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + ExtendedDayNum x; + if (!checkChar('\'', istr) || !tryReadDateText(x, istr, time_zone) || !checkChar('\'', istr)) + return false; + assert_cast(column).getData().push_back(x); /// It's important to do this at the end - for exception safety. + return true; +} + void SerializationDate32::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -65,6 +92,15 @@ void SerializationDate32::deserializeTextJSON(IColumn & column, ReadBuffer & ist assert_cast(column).getData().push_back(x); } +bool SerializationDate32::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + ExtendedDayNum x; + if (!checkChar('"', istr) || !tryReadDateText(x, istr, time_zone) || !checkChar('"', istr)) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationDate32::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -79,6 +115,15 @@ void SerializationDate32::deserializeTextCSV(IColumn & column, ReadBuffer & istr assert_cast(column).getData().push_back(value.getExtenedDayNum()); } +bool SerializationDate32::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + LocalDate value; + if (!tryReadCSV(value, istr)) + return false; + assert_cast(column).getData().push_back(value.getExtenedDayNum()); + return true; +} + SerializationDate32::SerializationDate32(const DateLUTImpl & time_zone_) : time_zone(time_zone_) { } diff --git a/src/DataTypes/Serializations/SerializationDate32.h b/src/DataTypes/Serializations/SerializationDate32.h index 49560fb6c7d..be2e2b76c1d 100644 --- a/src/DataTypes/Serializations/SerializationDate32.h +++ b/src/DataTypes/Serializations/SerializationDate32.h @@ -12,14 +12,19 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const 
FormatSettings & settings) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; protected: const DateLUTImpl & time_zone; diff --git a/src/DataTypes/Serializations/SerializationDateTime.cpp b/src/DataTypes/Serializations/SerializationDateTime.cpp index 77beb0d9b75..17465d85e9d 100644 --- a/src/DataTypes/Serializations/SerializationDateTime.cpp +++ b/src/DataTypes/Serializations/SerializationDateTime.cpp @@ -21,15 +21,56 @@ inline void readText(time_t & x, ReadBuffer & istr, const FormatSettings & setti switch (settings.date_time_input_format) { case FormatSettings::DateTimeInputFormat::Basic: - readDateTimeText(x, istr, time_zone); - return; + readDateTimeTextImpl<>(x, istr, time_zone); + break; case FormatSettings::DateTimeInputFormat::BestEffort: parseDateTimeBestEffort(x, istr, time_zone, utc_time_zone); - return; + break; case FormatSettings::DateTimeInputFormat::BestEffortUS: parseDateTimeBestEffortUS(x, istr, time_zone, utc_time_zone); - return; + break; } + + if (x < 0) + x = 0; +} + +inline void readAsIntText(time_t & x, ReadBuffer & istr) +{ + readIntText(x, istr); + if (x < 0) + x = 0; +} + +inline bool tryReadText(time_t & x, ReadBuffer & istr, const FormatSettings & settings, const DateLUTImpl & time_zone, const DateLUTImpl & utc_time_zone) +{ + bool res; + switch (settings.date_time_input_format) + { + case FormatSettings::DateTimeInputFormat::Basic: + res = tryReadDateTimeText(x, istr, time_zone); + break; + case FormatSettings::DateTimeInputFormat::BestEffort: + res = tryParseDateTimeBestEffort(x, istr, time_zone, utc_time_zone); + break; + case FormatSettings::DateTimeInputFormat::BestEffortUS: + res = tryParseDateTimeBestEffortUS(x, istr, time_zone, utc_time_zone); + break; + } + + if (x < 0) + x = 0; + + return res; +} + +inline bool tryReadAsIntText(time_t & x, ReadBuffer & istr) +{ + if (!tryReadIntText(x, istr)) + return false; + if (x < 0) + x = 0; + return true; } } @@ -68,15 +109,32 @@ void SerializationDateTime::deserializeWholeText(IColumn & column, ReadBuffer & throwUnexpectedDataAfterParsedValue(column, istr, settings, "DateTime"); } +bool SerializationDateTime::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + time_t x = 0; + if (!tryReadText(x, istr, settings, time_zone, utc_time_zone) || !istr.eof()) + return false; + + assert_cast(column).getData().push_back(static_cast(x)); + return true; +} + void SerializationDateTime::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { time_t x = 0; readText(x, istr, settings, time_zone, utc_time_zone); - if (x < 0) - x = 0; assert_cast(column).getData().push_back(static_cast(x)); } +bool SerializationDateTime::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + time_t x = 0; + if (!tryReadText(x, istr, settings, time_zone, utc_time_zone)) + return false; + assert_cast(column).getData().push_back(static_cast(x)); + return true; +} + void SerializationDateTime::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('\'', ostr); @@ -94,15 +152,32 @@ void SerializationDateTime::deserializeTextQuoted(IColumn & column, ReadBuffer & } else /// Just 1504193808 or 01504193808 { - readIntText(x, istr); + readAsIntText(x, istr); } - if (x < 0) - x = 0; /// It's important to do this at the end - for exception safety. 
assert_cast(column).getData().push_back(static_cast(x)); } +bool SerializationDateTime::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + time_t x = 0; + if (checkChar('\'', istr)) /// Cases: '2017-08-31 18:36:48' or '1504193808' + { + if (!tryReadText(x, istr, settings, time_zone, utc_time_zone) || !checkChar('\'', istr)) + return false; + } + else /// Just 1504193808 or 01504193808 + { + if (!tryReadAsIntText(x, istr)) + return false; + } + + /// It's important to do this at the end - for exception safety. + assert_cast(column).getData().push_back(static_cast(x)); + return true; +} + void SerializationDateTime::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -120,13 +195,30 @@ void SerializationDateTime::deserializeTextJSON(IColumn & column, ReadBuffer & i } else { - readIntText(x, istr); + readAsIntText(x, istr); } - if (x < 0) - x = 0; + assert_cast(column).getData().push_back(static_cast(x)); } +bool SerializationDateTime::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + time_t x = 0; + if (checkChar('"', istr)) + { + if (!tryReadText(x, istr, settings, time_zone, utc_time_zone) || !checkChar('"', istr)) + return false; + } + else + { + if (!tryReadIntText(x, istr)) + return false; + } + + assert_cast(column).getData().push_back(static_cast(x)); + return true; +} + void SerializationDateTime::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -165,13 +257,48 @@ void SerializationDateTime::deserializeTextCSV(IColumn & column, ReadBuffer & is readCSVString(datetime_str, istr, settings.csv); ReadBufferFromString buf(datetime_str); readText(x, buf, settings, time_zone, utc_time_zone); + if (!buf.eof()) + throwUnexpectedDataAfterParsedValue(column, istr, settings, "DateTime"); } } - if (x < 0) - x = 0; - assert_cast(column).getData().push_back(static_cast(x)); } +bool SerializationDateTime::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + time_t x = 0; + + if (istr.eof()) + return false; + + char maybe_quote = *istr.position(); + + if (maybe_quote == '\'' || maybe_quote == '\"') + { + ++istr.position(); + if (!tryReadText(x, istr, settings, time_zone, utc_time_zone) || !checkChar(maybe_quote, istr)) + return false; + } + else + { + if (settings.csv.delimiter != ',' || settings.date_time_input_format == FormatSettings::DateTimeInputFormat::Basic) + { + if (!tryReadText(x, istr, settings, time_zone, utc_time_zone)) + return false; + } + else + { + String datetime_str; + readCSVString(datetime_str, istr, settings.csv); + ReadBufferFromString buf(datetime_str); + if (!tryReadText(x, buf, settings, time_zone, utc_time_zone) || !buf.eof()) + return false; + } + } + + assert_cast(column).getData().push_back(static_cast(x)); + return true; +} + } diff --git a/src/DataTypes/Serializations/SerializationDateTime.h b/src/DataTypes/Serializations/SerializationDateTime.h index f4a142483e5..584b0c4116b 100644 --- a/src/DataTypes/Serializations/SerializationDateTime.h +++ b/src/DataTypes/Serializations/SerializationDateTime.h @@ -15,14 +15,19 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & 
settings) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; }; } diff --git a/src/DataTypes/Serializations/SerializationDateTime64.cpp b/src/DataTypes/Serializations/SerializationDateTime64.cpp index 93891886000..a19619bf8d3 100644 --- a/src/DataTypes/Serializations/SerializationDateTime64.cpp +++ b/src/DataTypes/Serializations/SerializationDateTime64.cpp @@ -47,6 +47,16 @@ void SerializationDateTime64::deserializeText(IColumn & column, ReadBuffer & ist throwUnexpectedDataAfterParsedValue(column, istr, settings, "DateTime64"); } +bool SerializationDateTime64::tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const +{ + DateTime64 result = 0; + /// Fail if the value cannot be parsed, or if trailing data remains when the whole buffer must be consumed. + if (!tryReadDateTime64Text(result, scale, istr, time_zone) || (whole && !istr.eof())) + return false; + + assert_cast(column).getData().push_back(result); + return true; +} + void SerializationDateTime64::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { deserializeTextEscaped(column, istr, settings); @@ -75,6 +85,29 @@ static inline void readText(DateTime64 & x, UInt32 scale, ReadBuffer & istr, con } } +static inline bool tryReadText(DateTime64 & x, UInt32 scale, ReadBuffer & istr, const FormatSettings & settings, const DateLUTImpl & time_zone, const DateLUTImpl & utc_time_zone) +{ + switch (settings.date_time_input_format) + { + case FormatSettings::DateTimeInputFormat::Basic: + return tryReadDateTime64Text(x, scale, istr, time_zone); + case FormatSettings::DateTimeInputFormat::BestEffort: + return tryParseDateTime64BestEffort(x, scale, istr, time_zone, utc_time_zone); + case FormatSettings::DateTimeInputFormat::BestEffortUS: + return tryParseDateTime64BestEffortUS(x, scale, istr, time_zone, utc_time_zone); + } +} + + +bool SerializationDateTime64::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + DateTime64 x = 0; + if (!tryReadText(x, scale, istr, settings, time_zone, utc_time_zone) || !istr.eof()) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + void
SerializationDateTime64::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { DateTime64 x = 0; @@ -82,6 +115,15 @@ void SerializationDateTime64::deserializeTextEscaped(IColumn & column, ReadBuffe assert_cast(column).getData().push_back(x); } +bool SerializationDateTime64::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + DateTime64 x = 0; + if (!tryReadText(x, scale, istr, settings, time_zone, utc_time_zone)) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationDateTime64::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('\'', ostr); @@ -104,6 +146,23 @@ void SerializationDateTime64::deserializeTextQuoted(IColumn & column, ReadBuffer assert_cast(column).getData().push_back(x); /// It's important to do this at the end - for exception safety. } +bool SerializationDateTime64::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + DateTime64 x = 0; + if (checkChar('\'', istr)) /// Cases: '2017-08-31 18:36:48' or '1504193808' + { + if (!tryReadText(x, scale, istr, settings, time_zone, utc_time_zone) || !checkChar('\'', istr)) + return false; + } + else /// Just 1504193808 or 01504193808 + { + if (!tryReadIntText(x, istr)) + return false; + } + assert_cast(column).getData().push_back(x); /// It's important to do this at the end - for exception safety. + return true; +} + void SerializationDateTime64::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -126,6 +185,23 @@ void SerializationDateTime64::deserializeTextJSON(IColumn & column, ReadBuffer & assert_cast(column).getData().push_back(x); } +bool SerializationDateTime64::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + DateTime64 x = 0; + if (checkChar('"', istr)) + { + if (!tryReadText(x, scale, istr, settings, time_zone, utc_time_zone) || !checkChar('"', istr)) + return false; + } + else + { + if (!tryReadIntText(x, istr)) + return false; + } + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationDateTime64::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -170,4 +246,40 @@ void SerializationDateTime64::deserializeTextCSV(IColumn & column, ReadBuffer & assert_cast(column).getData().push_back(x); } +bool SerializationDateTime64::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + DateTime64 x = 0; + + if (istr.eof()) + return false; + + char maybe_quote = *istr.position(); + + if (maybe_quote == '\'' || maybe_quote == '\"') + { + ++istr.position(); + if (!tryReadText(x, scale, istr, settings, time_zone, utc_time_zone) || !checkChar(maybe_quote, istr)) + return false; + } + else + { + if (settings.csv.delimiter != ',' || settings.date_time_input_format == FormatSettings::DateTimeInputFormat::Basic) + { + if (!tryReadText(x, scale, istr, settings, time_zone, utc_time_zone)) + return false; + } + else + { + String datetime_str; + readCSVString(datetime_str, istr, settings.csv); + ReadBufferFromString buf(datetime_str); + if (!tryReadText(x, scale, buf, settings, time_zone, utc_time_zone) || !buf.eof()) + return false; + } + } + +
assert_cast(column).getData().push_back(x); + return true; +} + } diff --git a/src/DataTypes/Serializations/SerializationDateTime64.h b/src/DataTypes/Serializations/SerializationDateTime64.h index f817edbf0dd..b49bd1e9098 100644 --- a/src/DataTypes/Serializations/SerializationDateTime64.h +++ b/src/DataTypes/Serializations/SerializationDateTime64.h @@ -15,15 +15,21 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override; + bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; }; } diff --git a/src/DataTypes/Serializations/SerializationDecimal.cpp b/src/DataTypes/Serializations/SerializationDecimal.cpp index b576b7a048c..d632c224783 100644 --- a/src/DataTypes/Serializations/SerializationDecimal.cpp +++ b/src/DataTypes/Serializations/SerializationDecimal.cpp @@ -16,11 +16,19 @@ namespace ErrorCodes } template -bool SerializationDecimal::tryReadText(T & x, ReadBuffer & istr, UInt32 precision, UInt32 scale) +bool SerializationDecimal::tryReadText(T & x, ReadBuffer & istr, UInt32 precision, UInt32 scale, bool csv) { UInt32 unread_scale = scale; - if (!tryReadDecimalText(istr, x, precision, unread_scale)) - return false; + if (csv) + { + if (!tryReadCSVDecimalText(istr, x, precision, unread_scale)) + return false; + } + else + { + if (!tryReadDecimalText(istr, x, precision, unread_scale)) + return false; + } if (common::mulOverflow(x.value, DecimalUtils::scaleMultiplier(unread_scale), x.value)) return false; @@ -59,6 +67,16 @@ void SerializationDecimal::deserializeText(IColumn & column, ReadBuffer & ist ISerialization::throwUnexpectedDataAfterParsedValue(column, istr, settings, "Decimal"); } +template +bool SerializationDecimal::tryDeserializeText(IColumn & column, ReadBuffer & istr, 
const FormatSettings &, bool whole) const +{ + T x; + if (!tryReadText(x, istr) || (whole && !istr.eof())) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + template void SerializationDecimal::deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { @@ -67,6 +85,16 @@ void SerializationDecimal::deserializeTextCSV(IColumn & column, ReadBuffer & assert_cast(column).getData().push_back(x); } +template +bool SerializationDecimal::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + T x; + if (!tryReadText(x, istr, true)) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + template void SerializationDecimal::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { @@ -88,6 +116,18 @@ void SerializationDecimal::deserializeTextJSON(IColumn & column, ReadBuffer & assertChar('"', istr); } +template +bool SerializationDecimal::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + bool have_quotes = checkChar('"', istr); + T x; + if (!tryReadText(x, istr) || (have_quotes && !checkChar('"', istr))) + return false; + + assert_cast(column).getData().push_back(x); + return true; +} + template class SerializationDecimal; template class SerializationDecimal; diff --git a/src/DataTypes/Serializations/SerializationDecimal.h b/src/DataTypes/Serializations/SerializationDecimal.h index 57decdd0973..22a8eb1a47c 100644 --- a/src/DataTypes/Serializations/SerializationDecimal.h +++ b/src/DataTypes/Serializations/SerializationDecimal.h @@ -16,15 +16,19 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const override; + bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void readText(T & x, ReadBuffer & istr, bool csv = false) const { readText(x, istr, this->precision, this->scale, csv); } + bool tryReadText(T & x, ReadBuffer & istr, bool csv = false) const { return tryReadText(x, istr, this->precision, this->scale, csv); } static void readText(T & x, ReadBuffer & istr, UInt32 precision_, UInt32 scale_, bool csv = false); - static bool tryReadText(T & x, ReadBuffer & istr, UInt32 precision_, UInt32 scale_); + static bool tryReadText(T & x, ReadBuffer & istr, UInt32 precision_, UInt32 scale_, bool csv = false); }; } diff --git a/src/DataTypes/Serializations/SerializationEnum.cpp b/src/DataTypes/Serializations/SerializationEnum.cpp index 9b3a437e9cf..6ad55913738 100644 --- a/src/DataTypes/Serializations/SerializationEnum.cpp +++ b/src/DataTypes/Serializations/SerializationEnum.cpp @@ -34,6 +34,27 @@ void SerializationEnum::deserializeTextEscaped(IColumn & column, ReadBuffe } } +template +bool 
SerializationEnum::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + FieldType x; + if (settings.tsv.enum_as_number) + { + if (!tryReadValue(istr, x)) + return false; + } + else + { + std::string field_name; + readEscapedString(field_name, istr); + if (!this->tryGetValue(x, StringRef(field_name), true)) + return false; + } + + assert_cast(column).getData().push_back(x); + return true; +} + template void SerializationEnum::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const { @@ -48,6 +69,18 @@ void SerializationEnum::deserializeTextQuoted(IColumn & column, ReadBuffer assert_cast(column).getData().push_back(ref_enum_values.getValue(StringRef(field_name))); } +template +bool SerializationEnum::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + std::string field_name; + readQuotedStringWithSQLStyle(field_name, istr); + FieldType x; + if (!this->tryGetValue(x, StringRef(field_name))) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + template void SerializationEnum::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { @@ -65,6 +98,27 @@ void SerializationEnum::deserializeWholeText(IColumn & column, ReadBuffer } } +template +bool SerializationEnum::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + FieldType x; + if (settings.tsv.enum_as_number) + { + if (!tryReadValue(istr, x) || !istr.eof()) + return false; + } + else + { + std::string field_name; + readStringUntilEOF(field_name, istr); + if (!this->tryGetValue(x, StringRef(field_name), true)) + return false; + } + + assert_cast(column).getData().push_back(x); + return true; +} + template void SerializationEnum::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { @@ -90,6 +144,27 @@ void SerializationEnum::deserializeTextJSON(IColumn & column, ReadBuffer & } } +template +bool SerializationEnum::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + FieldType x; + if (!istr.eof() && *istr.position() != '"') + { + if (!tryReadValue(istr, x)) + return false; + } + else + { + std::string field_name; + readJSONString(field_name, istr); + if (!this->tryGetValue(x, StringRef(field_name))) + return false; + } + + assert_cast(column).getData().push_back(x); + return true; +} + template void SerializationEnum::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const { @@ -109,6 +184,28 @@ void SerializationEnum::deserializeTextCSV(IColumn & column, ReadBuffer & } } +template +bool SerializationEnum::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + FieldType x; + + if (settings.csv.enum_as_number) + { + if (!tryReadValue(istr, x)) + return false; + } + else + { + std::string field_name; + readCSVString(field_name, istr, settings.csv); + if (!this->tryGetValue(x, StringRef(field_name), true)) + return false; + } + + assert_cast(column).getData().push_back(x); + return true; +} + template void SerializationEnum::serializeTextMarkdown( const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const diff --git a/src/DataTypes/Serializations/SerializationEnum.h b/src/DataTypes/Serializations/SerializationEnum.h index 
03b134e59a6..708161dc5fd 100644 --- a/src/DataTypes/Serializations/SerializationEnum.h +++ b/src/DataTypes/Serializations/SerializationEnum.h @@ -34,15 +34,20 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextMarkdown(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; @@ -53,6 +58,14 @@ public: return ref_enum_values.findByValue(x)->first; } + bool tryReadValue(ReadBuffer & istr, FieldType & x) const + { + if (!tryReadText(x, istr) || !this->hasValue(x)) + return false; + + return true; + } + std::optional> own_enum_values; std::shared_ptr> own_enum_type; const EnumValues & ref_enum_values; diff --git a/src/DataTypes/Serializations/SerializationFixedString.cpp b/src/DataTypes/Serializations/SerializationFixedString.cpp index fa50af52f2f..23e959d80c9 100644 --- a/src/DataTypes/Serializations/SerializationFixedString.cpp +++ b/src/DataTypes/Serializations/SerializationFixedString.cpp @@ -150,12 +150,49 @@ static inline void read(const SerializationFixedString & self, IColumn & column, } } +bool SerializationFixedString::tryAlignStringLength(size_t n, PaddedPODArray & data, size_t string_start) +{ + size_t length = data.size() - string_start; + if (length < n) + { + data.resize_fill(string_start + n); + } + else if (length > n) + { + data.resize_assume_reserved(string_start); + return false; + } + + return true; +} + +template +static inline bool tryRead(const SerializationFixedString & self, IColumn & column, Reader && reader) +{ + ColumnFixedString::Chars & data = typeid_cast(column).getChars(); + size_t prev_size = data.size(); + try + { + return reader(data) && SerializationFixedString::tryAlignStringLength(self.getN(), data, prev_size); + } + catch (...) 
+ { + data.resize_assume_reserved(prev_size); + return false; + } +} + void SerializationFixedString::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { read(*this, column, [&istr](ColumnFixedString::Chars & data) { readEscapedStringInto(data, istr); }); } +bool SerializationFixedString::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + return tryRead(*this, column, [&istr](ColumnFixedString::Chars & data) { readEscapedStringInto(data, istr); return true; }); +} + void SerializationFixedString::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const { @@ -169,12 +206,22 @@ void SerializationFixedString::deserializeTextQuoted(IColumn & column, ReadBuffe read(*this, column, [&istr](ColumnFixedString::Chars & data) { readQuotedStringInto(data, istr); }); } +bool SerializationFixedString::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + return tryRead(*this, column, [&istr](ColumnFixedString::Chars & data) { return tryReadQuotedStringInto(data, istr); }); +} + void SerializationFixedString::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { read(*this, column, [&istr](ColumnFixedString::Chars & data) { readStringUntilEOFInto(data, istr); }); } +bool SerializationFixedString::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + return tryRead(*this, column, [&istr](ColumnFixedString::Chars & data) { readStringUntilEOFInto(data, istr); return true; }); +} + void SerializationFixedString::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { @@ -188,6 +235,10 @@ void SerializationFixedString::deserializeTextJSON(IColumn & column, ReadBuffer read(*this, column, [&istr](ColumnFixedString::Chars & data) { readJSONStringInto(data, istr); }); } +bool SerializationFixedString::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + return tryRead(*this, column, [&istr](ColumnFixedString::Chars & data) { return tryReadJSONStringInto(data, istr); }); +} void SerializationFixedString::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const { @@ -208,6 +259,11 @@ void SerializationFixedString::deserializeTextCSV(IColumn & column, ReadBuffer & read(*this, column, [&istr, &csv = settings.csv](ColumnFixedString::Chars & data) { readCSVStringInto(data, istr, csv); }); } +bool SerializationFixedString::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return tryRead(*this, column, [&istr, &csv = settings.csv](ColumnFixedString::Chars & data) { readCSVStringInto(data, istr, csv); return true; }); +} + void SerializationFixedString::serializeTextMarkdown( const DB::IColumn & column, size_t row_num, DB::WriteBuffer & ostr, const DB::FormatSettings & settings) const { diff --git a/src/DataTypes/Serializations/SerializationFixedString.h b/src/DataTypes/Serializations/SerializationFixedString.h index c27b10ad158..8eb4eacdbff 100644 --- a/src/DataTypes/Serializations/SerializationFixedString.h +++ b/src/DataTypes/Serializations/SerializationFixedString.h @@ -26,20 +26,25 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, 
ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextMarkdown(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; @@ -47,6 +52,7 @@ public: /// If the length is less than getN() the function will add zero characters up to getN(). /// If the length is greater than getN() the function will throw an exception. 
static void alignStringLength(size_t n, PaddedPODArray & data, size_t string_start); + static bool tryAlignStringLength(size_t n, PaddedPODArray & data, size_t string_start); }; } diff --git a/src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp b/src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp new file mode 100644 index 00000000000..81c4af97401 --- /dev/null +++ b/src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp @@ -0,0 +1,188 @@ +#include + +namespace DB +{ + +template +void SerializationIP::serializeText(const DB::IColumn & column, size_t row_num, DB::WriteBuffer & ostr, const DB::FormatSettings &) const +{ + writeText(assert_cast &>(column).getData()[row_num], ostr); +} + +template +void SerializationIP::deserializeText(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, bool whole) const +{ + IPv x; + readText(x, istr); + + if (whole && !istr.eof()) + throwUnexpectedDataAfterParsedValue(column, istr, settings, TypeName.data()); + + assert_cast &>(column).getData().push_back(x); +} + +template +bool SerializationIP::tryDeserializeText(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings &, bool whole) const +{ + IPv x; + if (!tryReadText(x, istr) || (whole && !istr.eof())) + return false; + + assert_cast &>(column).getData().push_back(x); + return true; +} + +template +void SerializationIP::serializeTextQuoted(const DB::IColumn & column, size_t row_num, DB::WriteBuffer & ostr, const DB::FormatSettings & settings) const +{ + writeChar('\'', ostr); + serializeText(column, row_num, ostr, settings); + writeChar('\'', ostr); +} + +template +void SerializationIP::deserializeTextQuoted(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings &) const +{ + IPv x; + assertChar('\'', istr); + readText(x, istr); + assertChar('\'', istr); + assert_cast &>(column).getData().push_back(x); /// It's important to do this at the end - for exception safety. +} + +template +bool SerializationIP::tryDeserializeTextQuoted(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings &) const +{ + IPv x; + if (!checkChar('\'', istr) || !tryReadText(x, istr) || !checkChar('\'', istr)) + return false; + assert_cast &>(column).getData().push_back(x); + return true; +} + +template +void SerializationIP::serializeTextJSON(const DB::IColumn & column, size_t row_num, DB::WriteBuffer & ostr, const DB::FormatSettings & settings) const +{ + writeChar('"', ostr); + serializeText(column, row_num, ostr, settings); + writeChar('"', ostr); +} + +template +void SerializationIP::deserializeTextJSON(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const +{ + IPv x; + assertChar('"', istr); + readText(x, istr); + /// this code looks weird, but we want to throw specific exception to match original behavior... 
+ if (istr.eof()) + assertChar('"', istr); + if (*istr.position() != '"') + throwUnexpectedDataAfterParsedValue(column, istr, settings, TypeName.data()); + istr.ignore(); + + assert_cast &>(column).getData().push_back(x); +} + +template +bool SerializationIP::tryDeserializeTextJSON(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings &) const +{ + IPv x; + if (!checkChar('"', istr) || !tryReadText(x, istr) || !checkChar('"', istr)) + return false; + + assert_cast &>(column).getData().push_back(x); + return true; +} + +template +void SerializationIP::serializeTextCSV(const DB::IColumn & column, size_t row_num, DB::WriteBuffer & ostr, const DB::FormatSettings & settings) const +{ + writeChar('"', ostr); + serializeText(column, row_num, ostr, settings); + writeChar('"', ostr); +} + +template +void SerializationIP::deserializeTextCSV(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings &) const +{ + IPv value; + readCSV(value, istr); + + assert_cast &>(column).getData().push_back(value); +} + +template +bool SerializationIP::tryDeserializeTextCSV(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings &) const +{ + IPv value; + if (!tryReadCSV(value, istr)) + return false; + + assert_cast &>(column).getData().push_back(value); + return true; +} + +template +void SerializationIP::serializeBinary(const Field & field, WriteBuffer & ostr, const FormatSettings &) const +{ + IPv x = field.get(); + if constexpr (std::is_same_v) + writeBinary(x, ostr); + else + writeBinaryLittleEndian(x, ostr); +} + +template +void SerializationIP::deserializeBinary(DB::Field & field, DB::ReadBuffer & istr, const DB::FormatSettings &) const +{ + IPv x; + if constexpr (std::is_same_v) + readBinary(x, istr); + else + readBinaryLittleEndian(x, istr); + field = NearestFieldType(x); +} + +template +void SerializationIP::serializeBinary(const DB::IColumn & column, size_t row_num, DB::WriteBuffer & ostr, const DB::FormatSettings &) const +{ + writeBinary(assert_cast &>(column).getData()[row_num], ostr); +} + +template +void SerializationIP::deserializeBinary(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings &) const +{ + IPv x; + readBinary(x.toUnderType(), istr); + assert_cast &>(column).getData().push_back(x); +} + +template +void SerializationIP::serializeBinaryBulk(const DB::IColumn & column, DB::WriteBuffer & ostr, size_t offset, size_t limit) const +{ + const typename ColumnVector::Container & x = typeid_cast &>(column).getData(); + + size_t size = x.size(); + + if (limit == 0 || offset + limit > size) + limit = size - offset; + + if (limit) + ostr.write(reinterpret_cast(&x[offset]), sizeof(IPv) * limit); +} + +template +void SerializationIP::deserializeBinaryBulk(DB::IColumn & column, DB::ReadBuffer & istr, size_t limit, double) const +{ + typename ColumnVector::Container & x = typeid_cast &>(column).getData(); + size_t initial_size = x.size(); + x.resize(initial_size + limit); + size_t size = istr.readBig(reinterpret_cast(&x[initial_size]), sizeof(IPv) * limit); + x.resize(initial_size + size / sizeof(IPv)); +} + +template class SerializationIP; +template class SerializationIP; + +} diff --git a/src/DataTypes/Serializations/SerializationIPv4andIPv6.h b/src/DataTypes/Serializations/SerializationIPv4andIPv6.h index 7d8669fd444..a53f257646b 100644 --- a/src/DataTypes/Serializations/SerializationIPv4andIPv6.h +++ b/src/DataTypes/Serializations/SerializationIPv4andIPv6.h @@ -13,123 +13,30 @@ template class SerializationIP : public SimpleTextSerialization 
{ public: - void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override - { - writeText(assert_cast &>(column).getData()[row_num], ostr); - } - void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override - { - IPv x; - readText(x, istr); + void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; + void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override; + bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override; - if (whole && !istr.eof()) - throwUnexpectedDataAfterParsedValue(column, istr, settings, TypeName.data()); + void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; + void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; - assert_cast &>(column).getData().push_back(x); - } - void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override - { - serializeText(column, row_num, ostr, settings); - } - void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override - { - deserializeText(column, istr, settings, false); - } - void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override - { - writeChar('\'', ostr); - serializeText(column, row_num, ostr, settings); - writeChar('\'', ostr); - } - void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override - { - IPv x; - assertChar('\'', istr); - readText(x, istr); - assertChar('\'', istr); - assert_cast &>(column).getData().push_back(x); /// It's important to do this at the end - for exception safety. - } - void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override - { - writeChar('"', ostr); - serializeText(column, row_num, ostr, settings); - writeChar('"', ostr); - } - void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override - { - IPv x; - assertChar('"', istr); - readText(x, istr); - /// this code looks weird, but we want to throw specific exception to match original behavior... 
- if (istr.eof()) - assertChar('"', istr); - if (*istr.position() != '"') - throwUnexpectedDataAfterParsedValue(column, istr, settings, TypeName.data()); - istr.ignore(); + void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; + void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; - assert_cast &>(column).getData().push_back(x); - } - void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override - { - writeChar('"', ostr); - serializeText(column, row_num, ostr, settings); - writeChar('"', ostr); - } - void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &/* settings*/) const override - { - IPv value; - readCSV(value, istr); + void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; + void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &/* settings*/) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &/* settings*/) const override; - assert_cast &>(column).getData().push_back(value); - } + void serializeBinary(const Field & field, WriteBuffer & ostr, const FormatSettings &) const override; + void deserializeBinary(Field & field, ReadBuffer & istr, const FormatSettings &) const override; - void serializeBinary(const Field & field, WriteBuffer & ostr, const FormatSettings &) const override - { - IPv x = field.get(); - if constexpr (std::is_same_v) - writeBinary(x, ostr); - else - writeBinaryLittleEndian(x, ostr); - } - void deserializeBinary(Field & field, ReadBuffer & istr, const FormatSettings &) const override - { - IPv x; - if constexpr (std::is_same_v) - readBinary(x, istr); - else - readBinaryLittleEndian(x, istr); - field = NearestFieldType(x); - } - void serializeBinary(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override - { - writeBinary(assert_cast &>(column).getData()[row_num], ostr); - } - void deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override - { - IPv x; - readBinary(x.toUnderType(), istr); - assert_cast &>(column).getData().push_back(x); - } - void serializeBinaryBulk(const IColumn & column, WriteBuffer & ostr, size_t offset, size_t limit) const override - { - const typename ColumnVector::Container & x = typeid_cast &>(column).getData(); + void serializeBinary(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; + void deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; - size_t size = x.size(); - - if (limit == 0 || offset + limit > size) - limit = size - offset; - - if (limit) - ostr.write(reinterpret_cast(&x[offset]), sizeof(IPv) * limit); - } - void deserializeBinaryBulk(IColumn & column, ReadBuffer & istr, size_t limit, double /*avg_value_size_hint*/) const override - { - typename ColumnVector::Container & x = typeid_cast &>(column).getData(); - size_t initial_size = x.size(); - x.resize(initial_size + limit); - size_t size = istr.readBig(reinterpret_cast(&x[initial_size]), sizeof(IPv) * limit); - x.resize(initial_size + size / sizeof(IPv)); - } + void serializeBinaryBulk(const IColumn & column, 
WriteBuffer & ostr, size_t offset, size_t limit) const override; + void deserializeBinaryBulk(IColumn & column, ReadBuffer & istr, size_t limit, double /*avg_value_size_hint*/) const override; }; using SerializationIPv4 = SerializationIP; diff --git a/src/DataTypes/Serializations/SerializationLowCardinality.cpp b/src/DataTypes/Serializations/SerializationLowCardinality.cpp index 3e1cbdb00f5..9efe05042ed 100644 --- a/src/DataTypes/Serializations/SerializationLowCardinality.cpp +++ b/src/DataTypes/Serializations/SerializationLowCardinality.cpp @@ -700,6 +700,11 @@ void SerializationLowCardinality::deserializeTextEscaped(IColumn & column, ReadB deserializeImpl(column, &ISerialization::deserializeTextEscaped, istr, settings); } +bool SerializationLowCardinality::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return tryDeserializeImpl(column, &ISerialization::tryDeserializeTextEscaped, istr, settings); +} + void SerializationLowCardinality::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { serializeImpl(column, row_num, &ISerialization::serializeTextQuoted, ostr, settings); @@ -710,11 +715,21 @@ void SerializationLowCardinality::deserializeTextQuoted(IColumn & column, ReadBu deserializeImpl(column, &ISerialization::deserializeTextQuoted, istr, settings); } +bool SerializationLowCardinality::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return tryDeserializeImpl(column, &ISerialization::tryDeserializeTextQuoted, istr, settings); +} + void SerializationLowCardinality::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { deserializeImpl(column, &ISerialization::deserializeWholeText, istr, settings); } +bool SerializationLowCardinality::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return tryDeserializeImpl(column, &ISerialization::tryDeserializeWholeText, istr, settings); +} + void SerializationLowCardinality::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { serializeImpl(column, row_num, &ISerialization::serializeTextCSV, ostr, settings); @@ -725,6 +740,11 @@ void SerializationLowCardinality::deserializeTextCSV(IColumn & column, ReadBuffe deserializeImpl(column, &ISerialization::deserializeTextCSV, istr, settings); } +bool SerializationLowCardinality::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return tryDeserializeImpl(column, &ISerialization::tryDeserializeTextCSV, istr, settings); +} + void SerializationLowCardinality::serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { serializeImpl(column, row_num, &ISerialization::serializeText, ostr, settings); @@ -740,6 +760,11 @@ void SerializationLowCardinality::deserializeTextJSON(IColumn & column, ReadBuff deserializeImpl(column, &ISerialization::deserializeTextJSON, istr, settings); } +bool SerializationLowCardinality::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return tryDeserializeImpl(column, &ISerialization::tryDeserializeTextJSON, istr, settings); +} + void SerializationLowCardinality::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { 
serializeImpl(column, row_num, &ISerialization::serializeTextXML, ostr, settings); @@ -750,6 +775,11 @@ void SerializationLowCardinality::deserializeTextRaw(IColumn & column, ReadBuffe deserializeImpl(column, &ISerialization::deserializeTextRaw, istr, settings); } +bool SerializationLowCardinality::tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return tryDeserializeImpl(column, &ISerialization::tryDeserializeTextRaw, istr, settings); +} + void SerializationLowCardinality::serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { serializeImpl(column, row_num, &ISerialization::serializeTextRaw, ostr, settings); @@ -769,7 +799,7 @@ template void SerializationLowCardinality::deserializeImpl( IColumn & column, SerializationLowCardinality::DeserializeFunctionPtr func, Args &&... args) const { - auto & low_cardinality_column= getColumnLowCardinality(column); + auto & low_cardinality_column = getColumnLowCardinality(column); auto temp_column = low_cardinality_column.getDictionary().getNestedColumn()->cloneEmpty(); auto serialization = dictionary_type->getDefaultSerialization(); @@ -778,4 +808,19 @@ void SerializationLowCardinality::deserializeImpl( low_cardinality_column.insertFromFullColumn(*temp_column, 0); } +template +bool SerializationLowCardinality::tryDeserializeImpl( + IColumn & column, SerializationLowCardinality::TryDeserializeFunctionPtr func, Args &&... args) const +{ + auto & low_cardinality_column = getColumnLowCardinality(column); + auto temp_column = low_cardinality_column.getDictionary().getNestedColumn()->cloneEmpty(); + + auto serialization = dictionary_type->getDefaultSerialization(); + if (!(serialization.get()->*func)(*temp_column, std::forward(args)...)) + return false; + + low_cardinality_column.insertFromFullColumn(*temp_column, 0); + return true; +} + } diff --git a/src/DataTypes/Serializations/SerializationLowCardinality.h b/src/DataTypes/Serializations/SerializationLowCardinality.h index 5f56bcf8108..d2c3a95c702 100644 --- a/src/DataTypes/Serializations/SerializationLowCardinality.h +++ b/src/DataTypes/Serializations/SerializationLowCardinality.h @@ -55,16 +55,22 @@ public: void deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const 
override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; void deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; private: @@ -79,6 +85,12 @@ private: template void deserializeImpl(IColumn & column, DeserializeFunctionPtr func, Args &&... args) const; + + template + using TryDeserializeFunctionPtr = bool (ISerialization::*)(IColumn &, Params ...) const; + + template + bool tryDeserializeImpl(IColumn & column, TryDeserializeFunctionPtr func, Args &&... args) const; }; } diff --git a/src/DataTypes/Serializations/SerializationMap.cpp b/src/DataTypes/Serializations/SerializationMap.cpp index 7588e630689..7b6f87baf2e 100644 --- a/src/DataTypes/Serializations/SerializationMap.cpp +++ b/src/DataTypes/Serializations/SerializationMap.cpp @@ -115,9 +115,11 @@ void SerializationMap::serializeTextImpl( writeChar('}', ostr); } -template -void SerializationMap::deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && reader) const +template +ReturnType SerializationMap::deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && reader) const { + static constexpr bool throw_exception = std::is_same_v; + auto & column_map = assert_cast(column); auto & nested_array = column_map.getNestedColumn(); @@ -128,7 +130,21 @@ void SerializationMap::deserializeTextImpl(IColumn & column, ReadBuffer & istr, auto & value_column = nested_tuple.getColumn(1); size_t size = 0; - assertChar('{', istr); + if constexpr (throw_exception) + assertChar('{', istr); + else if (!checkChar('{', istr)) + return ReturnType(false); + + auto on_error_no_throw = [&]() + { + if (size) + { + nested_tuple.getColumnPtr(0) = key_column.cut(0, offsets.back()); + nested_tuple.getColumnPtr(1) = value_column.cut(0, offsets.back()); + } + + return ReturnType(false); + }; try { @@ -138,9 +154,15 @@ void SerializationMap::deserializeTextImpl(IColumn & column, ReadBuffer & istr, if (!first) { if (*istr.position() == ',') + { ++istr.position(); + } else - throw Exception(ErrorCodes::CANNOT_READ_MAP_FROM_TEXT, "Cannot read Map from text"); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::CANNOT_READ_MAP_FROM_TEXT, "Cannot read Map from text"); + return on_error_no_throw(); + } } first = false; @@ -150,19 +172,32 @@ void SerializationMap::deserializeTextImpl(IColumn & column, ReadBuffer & istr, if (*istr.position() == '}') break; - reader(istr, key, key_column); + if constexpr (throw_exception) + reader(istr, key, key_column); + else if (!reader(istr, key, key_column)) + return on_error_no_throw(); + ++size; skipWhitespaceIfAny(istr); - assertChar(':', 
istr); + if constexpr (throw_exception) + assertChar(':', istr); + else if (!checkChar(':', istr)) + return on_error_no_throw(); skipWhitespaceIfAny(istr); - reader(istr, value, value_column); + if constexpr (throw_exception) + reader(istr, value, value_column); + else if (!reader(istr, value, value_column)) + return on_error_no_throw(); skipWhitespaceIfAny(istr); } - assertChar('}', istr); + if constexpr (throw_exception) + assertChar('}', istr); + else if (!checkChar('}', istr)) + return on_error_no_throw(); } catch (...) { @@ -171,10 +206,14 @@ void SerializationMap::deserializeTextImpl(IColumn & column, ReadBuffer & istr, nested_tuple.getColumnPtr(0) = key_column.cut(0, offsets.back()); nested_tuple.getColumnPtr(1) = value_column.cut(0, offsets.back()); } - throw; + + if constexpr (throw_exception) + throw; + return ReturnType(false); } offsets.push_back(offsets.back() + size); + return ReturnType(true); } void SerializationMap::serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const @@ -192,8 +231,8 @@ void SerializationMap::deserializeText(IColumn & column, ReadBuffer & istr, cons deserializeTextImpl(column, istr, [&settings](ReadBuffer & buf, const SerializationPtr & subcolumn_serialization, IColumn & subcolumn) { - if (settings.null_as_default) - SerializationNullable::deserializeTextQuotedImpl(subcolumn, buf, settings, subcolumn_serialization); + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(subcolumn)) + SerializationNullable::deserializeNullAsDefaultOrNestedTextQuoted(subcolumn, buf, settings, subcolumn_serialization); else subcolumn_serialization->deserializeTextQuoted(subcolumn, buf, settings); }); @@ -202,6 +241,28 @@ void SerializationMap::deserializeText(IColumn & column, ReadBuffer & istr, cons throwUnexpectedDataAfterParsedValue(column, istr, settings, "Map"); } +bool SerializationMap::tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const +{ + auto reader = [&settings](ReadBuffer & buf, const SerializationPtr & subcolumn_serialization, IColumn & subcolumn) + { + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(subcolumn)) + return SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextQuoted(subcolumn, buf, settings, subcolumn_serialization); + return subcolumn_serialization->tryDeserializeTextQuoted(subcolumn, buf, settings); + }; + + auto ok = deserializeTextImpl(column, istr, reader); + if (!ok) + return false; + + if (whole && !istr.eof()) + { + column.popBack(1); + return false; + } + + return true; +} + void SerializationMap::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { serializeTextImpl(column, row_num, ostr, @@ -260,13 +321,25 @@ void SerializationMap::deserializeTextJSON(IColumn & column, ReadBuffer & istr, deserializeTextImpl(column, istr, [&settings](ReadBuffer & buf, const SerializationPtr & subcolumn_serialization, IColumn & subcolumn) { - if (settings.null_as_default) - SerializationNullable::deserializeTextJSONImpl(subcolumn, buf, settings, subcolumn_serialization); + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(subcolumn)) + SerializationNullable::deserializeNullAsDefaultOrNestedTextJSON(subcolumn, buf, settings, subcolumn_serialization); else subcolumn_serialization->deserializeTextJSON(subcolumn, buf, settings); }); } +bool SerializationMap::tryDeserializeTextJSON(IColumn & column, 
ReadBuffer & istr, const FormatSettings & settings) const +{ + auto reader = [&settings](ReadBuffer & buf, const SerializationPtr & subcolumn_serialization, IColumn & subcolumn) + { + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(subcolumn)) + return SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextJSON(subcolumn, buf, settings, subcolumn_serialization); + return subcolumn_serialization->tryDeserializeTextJSON(subcolumn, buf, settings); + }; + + return deserializeTextImpl(column, istr, reader); +} + void SerializationMap::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { const auto & column_map = assert_cast(column); @@ -308,6 +381,15 @@ void SerializationMap::deserializeTextCSV(IColumn & column, ReadBuffer & istr, c deserializeText(column, rb, settings, true); } +bool SerializationMap::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String s; + if (!tryReadCSV(s, istr, settings.csv)) + return false; + ReadBufferFromString rb(s); + return tryDeserializeText(column, rb, settings, true); +} + void SerializationMap::enumerateStreams( EnumerateStreamsSettings & settings, const StreamCallback & callback, diff --git a/src/DataTypes/Serializations/SerializationMap.h b/src/DataTypes/Serializations/SerializationMap.h index f32c656757d..3e27ef1b04a 100644 --- a/src/DataTypes/Serializations/SerializationMap.h +++ b/src/DataTypes/Serializations/SerializationMap.h @@ -24,13 +24,16 @@ public: void deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const override; + bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSONPretty(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings, size_t indent) const override; void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void enumerateStreams( EnumerateStreamsSettings & settings, @@ -68,8 +71,8 @@ private: template void serializeTextImpl(const IColumn & column, size_t row_num, WriteBuffer & ostr, KeyWriter && key_writer, ValueWriter && value_writer) const; - template - void deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && reader) const; + template + ReturnType deserializeTextImpl(IColumn & column, ReadBuffer & istr, Reader && reader) const; }; } diff --git a/src/DataTypes/Serializations/SerializationNamed.cpp b/src/DataTypes/Serializations/SerializationNamed.cpp index ca60948ce68..1a9cbe9a37d 100644 
--- a/src/DataTypes/Serializations/SerializationNamed.cpp +++ b/src/DataTypes/Serializations/SerializationNamed.cpp @@ -1,4 +1,5 @@ #include +#include namespace DB { diff --git a/src/DataTypes/Serializations/SerializationNothing.h b/src/DataTypes/Serializations/SerializationNothing.h index 02974d1ca76..7d1fff55b01 100644 --- a/src/DataTypes/Serializations/SerializationNothing.h +++ b/src/DataTypes/Serializations/SerializationNothing.h @@ -25,6 +25,7 @@ public: void deserializeBinary(IColumn &, ReadBuffer &, const FormatSettings &) const override { throwNoSerialization(); } void serializeText(const IColumn &, size_t, WriteBuffer &, const FormatSettings &) const override { throwNoSerialization(); } void deserializeText(IColumn &, ReadBuffer &, const FormatSettings &, bool) const override { throwNoSerialization(); } + bool tryDeserializeText(IColumn &, ReadBuffer &, const FormatSettings &, bool) const override { throwNoSerialization(); } /// These methods read and write zero bytes just to allow to figure out size of column. void serializeBinaryBulk(const IColumn & column, WriteBuffer & ostr, size_t offset, size_t limit) const override; diff --git a/src/DataTypes/Serializations/SerializationNullable.cpp b/src/DataTypes/Serializations/SerializationNullable.cpp index 15203bdc9fa..e7f0e61f2a5 100644 --- a/src/DataTypes/Serializations/SerializationNullable.cpp +++ b/src/DataTypes/Serializations/SerializationNullable.cpp @@ -187,55 +187,59 @@ void SerializationNullable::serializeBinary(const IColumn & column, size_t row_n nested->serializeBinary(col.getNestedColumn(), row_num, ostr, settings); } -/// Deserialize value into ColumnNullable. -/// We need to insert both to nested column and to null byte map, or, in case of exception, to not insert at all. -template -requires std::same_as -static ReturnType -safeDeserialize(IColumn & column, const ISerialization &, CheckForNull && check_for_null, DeserializeNested && deserialize_nested) +template +ReturnType safeAppendToNullMap(ColumnNullable & column, bool is_null) { - ColumnNullable & col = assert_cast(column); - - if (check_for_null()) + try { - col.insertDefault(); + column.getNullMapData().push_back(is_null); } - else + catch (...) { - deserialize_nested(col.getNestedColumn()); - - try - { - col.getNullMapData().push_back(0); - } - catch (...) - { - col.getNestedColumn().popBack(1); + column.getNestedColumn().popBack(1); + if constexpr (std::is_same_v) throw; - } + return ReturnType(false); } + + return ReturnType(true); } -/// Deserialize value into non-nullable column. In case of NULL, insert default value and return false. +/// Deserialize value into non-nullable column. In case of NULL, insert default and set is_null to true. +/// If ReturnType is bool, return true if parsing was successful and false in case of any error.
template -requires std::same_as -static ReturnType -safeDeserialize(IColumn & column, const ISerialization &, CheckForNull && check_for_null, DeserializeNested && deserialize_nested) +static ReturnType deserializeImpl(IColumn & column, ReadBuffer & buf, CheckForNull && check_for_null, DeserializeNested && deserialize_nested, bool & is_null) { - bool insert_default = check_for_null(); - if (insert_default) + is_null = check_for_null(buf); + if (is_null) + { column.insertDefault(); + } else - deserialize_nested(column); - return !insert_default; + { + if constexpr (std::is_same_v) + deserialize_nested(column, buf); + else if (!deserialize_nested(column, buf)) + return ReturnType(false); + } + + return ReturnType(true); } void SerializationNullable::deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { - safeDeserialize(column, *nested, - [&istr] { bool is_null = false; readBinary(is_null, istr); return is_null; }, - [this, &istr, settings] (IColumn & nested_column) { nested->deserializeBinary(nested_column, istr, settings); }); + ColumnNullable & col = assert_cast(column); + bool is_null; + auto check_for_null = [](ReadBuffer & buf) + { + bool is_null_ = false; + readBinary(is_null_, buf); + return is_null_; + }; + auto deserialize_nested = [this, &settings] (IColumn & nested_column, ReadBuffer & buf) { nested->deserializeBinary(nested_column, buf, settings); }; + deserializeImpl(col.getNestedColumn(), istr, check_for_null, deserialize_nested, is_null); + safeAppendToNullMap(col, is_null); } @@ -244,20 +248,19 @@ void SerializationNullable::serializeTextEscaped(const IColumn & column, size_t const ColumnNullable & col = assert_cast(column); if (col.isNullAt(row_num)) - writeString(settings.tsv.null_representation, ostr); + serializeNullEscaped(ostr, settings); else nested->serializeTextEscaped(col.getNestedColumn(), row_num, ostr, settings); } - -void SerializationNullable::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +void SerializationNullable::serializeNullEscaped(DB::WriteBuffer & ostr, const DB::FormatSettings & settings) { - deserializeTextEscapedImpl(column, istr, settings, nested); + writeString(settings.tsv.null_representation, ostr); } -void SerializationNullable::deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +bool SerializationNullable::tryDeserializeNullEscaped(DB::ReadBuffer & istr, const DB::FormatSettings & settings) { - deserializeTextRawImpl(column, istr, settings, nested); + return checkString(settings.tsv.null_representation, istr); } void SerializationNullable::serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const @@ -265,72 +268,73 @@ void SerializationNullable::serializeTextRaw(const IColumn & column, size_t row_ const ColumnNullable & col = assert_cast(column); if (col.isNullAt(row_num)) - writeString(settings.tsv.null_representation, ostr); + serializeNullRaw(ostr, settings); else nested->serializeTextRaw(col.getNestedColumn(), row_num, ostr, settings); } -template -ReturnType SerializationNullable::deserializeTextRawImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested) +void SerializationNullable::serializeNullRaw(DB::WriteBuffer & ostr, const DB::FormatSettings & settings) { - return deserializeTextEscapedAndRawImpl(column, istr, settings, nested); + writeString(settings.tsv.null_representation, ostr); } 
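Aside: every deserialize/tryDeserialize pair introduced here shares a single implementation templated on ReturnType. With ReturnType = void the function reports malformed input by throwing; with ReturnType = bool it returns false instead, and `return ReturnType(true)` compiles in both cases because a functional cast to void is well-formed. A minimal, self-contained sketch of that scheme follows (illustrative only; the names are hypothetical and this is not ClickHouse code):

#include <stdexcept>
#include <string>
#include <type_traits>

// Shared implementation: ReturnType = void throws on error, ReturnType = bool returns false.
template <typename ReturnType = void>
ReturnType parseDigitImpl(const std::string & s, int & out)
{
    static constexpr bool throw_exception = std::is_same_v<ReturnType, void>;

    if (s.size() != 1 || s[0] < '0' || s[0] > '9')
    {
        if constexpr (throw_exception)
            throw std::runtime_error("not a digit: " + s);
        else
            return false; // this branch is discarded when ReturnType is void
    }

    out = s[0] - '0';
    return ReturnType(true); // void(true) for the throwing variant, true for the try-variant
}

// Throwing entry point, analogous to deserialize*().
void parseDigit(const std::string & s, int & out)
{
    parseDigitImpl(s, out);
}

// Non-throwing entry point, analogous to tryDeserialize*().
bool tryParseDigit(const std::string & s, int & out)
{
    return parseDigitImpl<bool>(s, out);
}

The patch applies the same idea with an extra is_null out-parameter, so that the ColumnNullable null map is appended separately through safeAppendToNullMap.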
-template -ReturnType SerializationNullable::deserializeTextEscapedImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, - const SerializationPtr & nested) +bool SerializationNullable::tryDeserializeNullRaw(DB::ReadBuffer & istr, const DB::FormatSettings & settings) { - return deserializeTextEscapedAndRawImpl(column, istr, settings, nested); + return checkString(settings.tsv.null_representation, istr); } template -ReturnType SerializationNullable::deserializeTextEscapedAndRawImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, - const SerializationPtr & nested_serialization) +ReturnType deserializeTextEscapedAndRawImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization, bool & is_null) { + static constexpr bool throw_exception = std::is_same_v; + const String & null_representation = settings.tsv.null_representation; + auto deserialize_nested = [&nested_serialization, &settings] (IColumn & nested_column, ReadBuffer & buf_) + { + if constexpr (throw_exception) + { + if constexpr (escaped) + nested_serialization->deserializeTextEscaped(nested_column, buf_, settings); + else + nested_serialization->deserializeTextRaw(nested_column, buf_, settings); + } + else + { + if constexpr (escaped) + return nested_serialization->tryDeserializeTextEscaped(nested_column, buf_, settings); + else + return nested_serialization->tryDeserializeTextRaw(nested_column, buf_, settings); + } + }; /// Some data types can deserialize absence of data (e.g. empty string), so eof is ok. if (istr.eof() || (!null_representation.empty() && *istr.position() != null_representation[0])) { /// This is not null, surely. - return safeDeserialize(column, *nested_serialization, - [] { return false; }, - [&nested_serialization, &istr, &settings] (IColumn & nested_column) - { - if constexpr (escaped) - nested_serialization->deserializeTextEscaped(nested_column, istr, settings); - else - nested_serialization->deserializeTextRaw(nested_column, istr, settings); - }); + return deserializeImpl(column, istr, [](ReadBuffer &){ return false; }, deserialize_nested, is_null); } /// Check if we have enough data in buffer to check if it's a null. if (istr.available() > null_representation.size()) { - auto check_for_null = [&istr, &null_representation]() + auto check_for_null = [&null_representation](ReadBuffer & buf) { - auto * pos = istr.position(); - if (checkString(null_representation, istr) && (*istr.position() == '\t' || *istr.position() == '\n')) + auto * pos = buf.position(); + if (checkString(null_representation, buf) && (*buf.position() == '\t' || *buf.position() == '\n')) return true; - istr.position() = pos; + buf.position() = pos; return false; }; - auto deserialize_nested = [&nested_serialization, &settings, &istr] (IColumn & nested_column) - { - if constexpr (escaped) - nested_serialization->deserializeTextEscaped(nested_column, istr, settings); - else - nested_serialization->deserializeTextRaw(nested_column, istr, settings); - }; - return safeDeserialize(column, *nested_serialization, check_for_null, deserialize_nested); + return deserializeImpl(column, istr, check_for_null, deserialize_nested, is_null); } /// We don't have enough data in buffer to check if it's a null. /// Use PeekableReadBuffer to make a checkpoint before checking null /// representation and rollback if check was failed. 
- PeekableReadBuffer buf(istr, true); - auto check_for_null = [&buf, &null_representation]() + PeekableReadBuffer peekable_buf(istr, true); + auto check_for_null = [&null_representation](ReadBuffer & buf_) { + auto & buf = assert_cast(buf_); buf.setCheckpoint(); SCOPE_EXIT(buf.dropCheckpoint()); if (checkString(null_representation, buf) && (buf.eof() || *buf.position() == '\t' || *buf.position() == '\n')) @@ -340,16 +344,18 @@ ReturnType SerializationNullable::deserializeTextEscapedAndRawImpl(IColumn & col return false; }; - auto deserialize_nested = [&nested_serialization, &settings, &buf, &null_representation, &istr] (IColumn & nested_column) + auto deserialize_nested_with_check = [&deserialize_nested, &nested_serialization, &settings, &null_representation, &istr] (IColumn & nested_column, ReadBuffer & buf_) { + auto & buf = assert_cast(buf_); auto * pos = buf.position(); - if constexpr (escaped) - nested_serialization->deserializeTextEscaped(nested_column, buf, settings); - else - nested_serialization->deserializeTextRaw(nested_column, buf, settings); + if constexpr (throw_exception) + deserialize_nested(nested_column, buf); + else if (!deserialize_nested(nested_column, buf)) + return ReturnType(false); + /// Check that we don't have any unread data in PeekableReadBuffer own memory. if (likely(!buf.hasUnreadData())) - return; + return ReturnType(true); /// We have some unread data in PeekableReadBuffer own memory. /// It can happen only if there is a string instead of a number @@ -358,6 +364,9 @@ ReturnType SerializationNullable::deserializeTextEscapedAndRawImpl(IColumn & col /// We also should delete incorrectly deserialized value from nested column. nested_column.popBack(1); + if constexpr (!throw_exception) + return ReturnType(false); + if (null_representation.find('\t') != std::string::npos || null_representation.find('\n') != std::string::npos) throw DB::ParsingException(ErrorCodes::CANNOT_READ_ALL_DATA, "TSV custom null representation " "containing '\\t' or '\\n' may not work correctly for large input."); @@ -375,7 +384,63 @@ ReturnType SerializationNullable::deserializeTextEscapedAndRawImpl(IColumn & col istr.count(), std::string(pos, buf.position() - pos), parsed_value.str()); }; - return safeDeserialize(column, *nested_serialization, check_for_null, deserialize_nested); + return deserializeImpl(column, peekable_buf, check_for_null, deserialize_nested_with_check, is_null); +} + +void SerializationNullable::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + ColumnNullable & col = assert_cast(column); + bool is_null; + deserializeTextEscapedAndRawImpl(col.getNestedColumn(), istr, settings, nested, is_null); + safeAppendToNullMap(col, is_null); +} + +bool SerializationNullable::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + ColumnNullable & col = assert_cast(column); + bool is_null; + return deserializeTextEscapedAndRawImpl(col.getNestedColumn(), istr, settings, nested, is_null) && safeAppendToNullMap(col, is_null); +} + +bool SerializationNullable::deserializeNullAsDefaultOrNestedTextEscaped(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization) +{ + bool is_null; + deserializeTextEscapedAndRawImpl(nested_column, istr, settings, nested_serialization, is_null); + return !is_null; +} + +bool SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextEscaped(IColumn & nested_column, ReadBuffer & istr, 
const FormatSettings & settings, const SerializationPtr & nested_serialization) +{ + bool is_null; + return deserializeTextEscapedAndRawImpl(nested_column, istr, settings, nested_serialization, is_null); +} + +void SerializationNullable::deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + ColumnNullable & col = assert_cast(column); + bool is_null; + deserializeTextEscapedAndRawImpl(col.getNestedColumn(), istr, settings, nested, is_null); + safeAppendToNullMap(col, is_null); +} + +bool SerializationNullable::tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + ColumnNullable & col = assert_cast(column); + bool is_null; + return deserializeTextEscapedAndRawImpl(col.getNestedColumn(), istr, settings, nested, is_null) && safeAppendToNullMap(col, is_null); +} + +bool SerializationNullable::deserializeNullAsDefaultOrNestedTextRaw(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization) +{ + bool is_null; + deserializeTextEscapedAndRawImpl(nested_column, istr, settings, nested_serialization, is_null); + return !is_null; +} + +bool SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextRaw(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization) +{ + bool is_null; + return deserializeTextEscapedAndRawImpl(nested_column, istr, settings, nested_serialization, is_null); } void SerializationNullable::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const @@ -383,45 +448,51 @@ void SerializationNullable::serializeTextQuoted(const IColumn & column, size_t r const ColumnNullable & col = assert_cast(column); if (col.isNullAt(row_num)) - writeCString("NULL", ostr); + serializeNullQuoted(ostr); else nested->serializeTextQuoted(col.getNestedColumn(), row_num, ostr, settings); } - -void SerializationNullable::deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +void SerializationNullable::serializeNullQuoted(DB::WriteBuffer & ostr) { - deserializeTextQuotedImpl(column, istr, settings, nested); + writeCString("NULL", ostr); +} + +bool SerializationNullable::tryDeserializeNullQuoted(DB::ReadBuffer & istr) +{ + return checkStringCaseInsensitive("NULL", istr); } template -ReturnType SerializationNullable::deserializeTextQuotedImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, - const SerializationPtr & nested) +ReturnType deserializeTextQuotedImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested, bool & is_null) { + static constexpr bool throw_exception = std::is_same_v; + + auto deserialize_nested = [&nested, &settings] (IColumn & nested_column, ReadBuffer & buf) + { + if constexpr (!throw_exception) + return nested->tryDeserializeTextQuoted(nested_column, buf, settings); + nested->deserializeTextQuoted(nested_column, buf, settings); + }; + if (istr.eof() || (*istr.position() != 'N' && *istr.position() != 'n')) { /// This is not null, surely. 
- return safeDeserialize(column, *nested, - [] { return false; }, - [&nested, &istr, &settings] (IColumn & nested_column) { nested->deserializeTextQuoted(nested_column, istr, settings); }); + return deserializeImpl(column, istr, [](ReadBuffer &){ return false; }, deserialize_nested, is_null); } /// Check if we have enough data in buffer to check if it's a null. if (istr.available() >= 4) { - auto check_for_null = [&istr]() + auto check_for_null = [](ReadBuffer & buf) { - auto * pos = istr.position(); - if (checkStringCaseInsensitive("NULL", istr)) + auto * pos = buf.position(); + if (checkStringCaseInsensitive("NULL", buf)) return true; - istr.position() = pos; + buf.position() = pos; return false; }; - auto deserialize_nested = [&nested, &settings, &istr] (IColumn & nested_column) - { - nested->deserializeTextQuoted(nested_column, istr, settings); - }; - return safeDeserialize(column, *nested, check_for_null, deserialize_nested); + return deserializeImpl(column, istr, check_for_null, deserialize_nested, is_null); } /// We don't have enough data in buffer to check if it's a NULL @@ -429,9 +500,10 @@ ReturnType SerializationNullable::deserializeTextQuotedImpl(IColumn & column, Re /// to differentiate for example NULL and NaN for float) /// Use PeekableReadBuffer to make a checkpoint before checking /// null and rollback if the check was failed. - PeekableReadBuffer buf(istr, true); - auto check_for_null = [&buf]() + PeekableReadBuffer peekable_buf(istr, true); + auto check_for_null = [](ReadBuffer & buf_) { + auto & buf = assert_cast(buf_); buf.setCheckpoint(); SCOPE_EXIT(buf.dropCheckpoint()); if (checkStringCaseInsensitive("NULL", buf)) @@ -441,39 +513,74 @@ ReturnType SerializationNullable::deserializeTextQuotedImpl(IColumn & column, Re return false; }; - auto deserialize_nested = [&nested, &settings, &buf] (IColumn & nested_column) + auto deserialize_nested_with_check = [&deserialize_nested] (IColumn & nested_column, ReadBuffer & buf_) { - nested->deserializeTextQuoted(nested_column, buf, settings); + auto & buf = assert_cast(buf_); + + if constexpr (throw_exception) + deserialize_nested(nested_column, buf); + else if (!deserialize_nested(nested_column, buf)) + return false; + /// Check that we don't have any unread data in PeekableReadBuffer own memory. if (likely(!buf.hasUnreadData())) - return; + return ReturnType(true); /// We have some unread data in PeekableReadBuffer own memory. /// It can happen only if there is an unquoted string instead of a number. /// We also should delete incorrectly deserialized value from nested column. 
nested_column.popBack(1); + + if constexpr (!throw_exception) + return ReturnType(false); + throw DB::ParsingException( ErrorCodes::CANNOT_READ_ALL_DATA, "Error while parsing Nullable: got an unquoted string {} instead of a number", String(buf.position(), std::min(10ul, buf.available()))); }; - return safeDeserialize(column, *nested, check_for_null, deserialize_nested); + return deserializeImpl(column, peekable_buf, check_for_null, deserialize_nested_with_check, is_null); } -void SerializationNullable::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +void SerializationNullable::deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { - deserializeWholeTextImpl(column, istr, settings, nested); + ColumnNullable & col = assert_cast(column); + bool is_null; + deserializeTextQuotedImpl(col.getNestedColumn(), istr, settings, nested, is_null); + safeAppendToNullMap(col, is_null); +} + +bool SerializationNullable::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + ColumnNullable & col = assert_cast(column); + bool is_null; + return deserializeTextQuotedImpl(col.getNestedColumn(), istr, settings, nested, is_null) && safeAppendToNullMap(col, is_null); +} + +bool SerializationNullable::deserializeNullAsDefaultOrNestedTextQuoted(DB::IColumn & nested_column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, const DB::SerializationPtr & nested_serialization) +{ + bool is_null; + deserializeTextQuotedImpl(nested_column, istr, settings, nested_serialization, is_null); + return !is_null; +} + +bool SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextQuoted(DB::IColumn & nested_column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, const DB::SerializationPtr & nested_serialization) +{ + bool is_null; + return deserializeTextQuotedImpl(nested_column, istr, settings, nested_serialization, is_null); } template -ReturnType SerializationNullable::deserializeWholeTextImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, - const SerializationPtr & nested) +ReturnType deserializeWholeTextImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested, bool & is_null) { - PeekableReadBuffer buf(istr, true); - auto check_for_null = [&buf]() + static constexpr bool throw_exception = std::is_same_v; + + PeekableReadBuffer peekable_buf(istr, true); + auto check_for_null = [](ReadBuffer & buf_) { + auto & buf = assert_cast(buf_); buf.setCheckpoint(); SCOPE_EXIT(buf.dropCheckpoint()); @@ -488,15 +595,46 @@ ReturnType SerializationNullable::deserializeWholeTextImpl(IColumn & column, Rea return false; }; - auto deserialize_nested = [&nested, &settings, &buf] (IColumn & nested_column) + auto deserialize_nested = [&nested, &settings] (IColumn & nested_column, ReadBuffer & buf_) { + auto & buf = assert_cast(buf_); + if constexpr (!throw_exception) + return nested->tryDeserializeWholeText(nested_column, buf, settings); + nested->deserializeWholeText(nested_column, buf, settings); assert(!buf.hasUnreadData()); }; - return safeDeserialize(column, *nested, check_for_null, deserialize_nested); + return deserializeImpl(column, peekable_buf, check_for_null, deserialize_nested, is_null); } +void SerializationNullable::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + ColumnNullable & col = assert_cast(column); + bool is_null; + 
deserializeWholeTextImpl(col.getNestedColumn(), istr, settings, nested, is_null); + safeAppendToNullMap(col, is_null); +} + +bool SerializationNullable::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + ColumnNullable & col = assert_cast(column); + bool is_null; + return deserializeWholeTextImpl(col.getNestedColumn(), istr, settings, nested, is_null) && safeAppendToNullMap(col, is_null); +} + +bool SerializationNullable::deserializeNullAsDefaultOrNestedWholeText(DB::IColumn & nested_column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, const DB::SerializationPtr & nested_serialization) +{ + bool is_null; + deserializeWholeTextImpl(nested_column, istr, settings, nested_serialization, is_null); + return !is_null; +} + +bool SerializationNullable::tryDeserializeNullAsDefaultOrNestedWholeText(DB::IColumn & nested_column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, const DB::SerializationPtr & nested_serialization) +{ + bool is_null; + return deserializeWholeTextImpl(nested_column, istr, settings, nested_serialization, is_null); +} void SerializationNullable::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { @@ -508,48 +646,56 @@ void SerializationNullable::serializeTextCSV(const IColumn & column, size_t row_ nested->serializeTextCSV(col.getNestedColumn(), row_num, ostr, settings); } -void SerializationNullable::deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +void SerializationNullable::serializeNullCSV(DB::WriteBuffer & ostr, const DB::FormatSettings & settings) { - deserializeTextCSVImpl(column, istr, settings, nested); + writeString(settings.csv.null_representation, ostr); +} + +bool SerializationNullable::tryDeserializeNullCSV(DB::ReadBuffer & istr, const DB::FormatSettings & settings) +{ + return checkString(settings.csv.null_representation, istr); } template -ReturnType SerializationNullable::deserializeTextCSVImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, - const SerializationPtr & nested_serialization) +ReturnType deserializeTextCSVImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization, bool & is_null) { + static constexpr bool throw_exception = std::is_same_v; + + auto deserialize_nested = [&nested_serialization, &settings] (IColumn & nested_column, ReadBuffer & buf) + { + if constexpr (!throw_exception) + return nested_serialization->tryDeserializeTextCSV(nested_column, buf, settings); + nested_serialization->deserializeTextCSV(nested_column, buf, settings); + }; + const String & null_representation = settings.csv.null_representation; if (istr.eof() || (!null_representation.empty() && *istr.position() != null_representation[0])) { /// This is not null, surely. - return safeDeserialize(column, *nested_serialization, - [] { return false; }, - [&nested_serialization, &istr, &settings] (IColumn & nested_column) { nested_serialization->deserializeTextCSV(nested_column, istr, settings); }); + return deserializeImpl(column, istr, [](ReadBuffer &){ return false; }, deserialize_nested, is_null); } /// Check if we have enough data in buffer to check if it's a null. 
if (settings.csv.custom_delimiter.empty() && istr.available() > null_representation.size()) { - auto check_for_null = [&istr, &null_representation, &settings]() + auto check_for_null = [&null_representation, &settings](ReadBuffer & buf) { - auto * pos = istr.position(); - if (checkString(null_representation, istr) && (*istr.position() == settings.csv.delimiter || *istr.position() == '\r' || *istr.position() == '\n')) + auto * pos = buf.position(); + if (checkString(null_representation, buf) && (*buf.position() == settings.csv.delimiter || *buf.position() == '\r' || *buf.position() == '\n')) return true; - istr.position() = pos; + buf.position() = pos; return false; }; - auto deserialize_nested = [&nested_serialization, &settings, &istr] (IColumn & nested_column) - { - nested_serialization->deserializeTextCSV(nested_column, istr, settings); - }; - return safeDeserialize(column, *nested_serialization, check_for_null, deserialize_nested); + return deserializeImpl(column, istr, check_for_null, deserialize_nested, is_null); } /// We don't have enough data in buffer to check if it's a null. /// Use PeekableReadBuffer to make a checkpoint before checking null /// representation and rollback if the check was failed. - PeekableReadBuffer buf(istr, true); - auto check_for_null = [&buf, &null_representation, &settings]() + PeekableReadBuffer peekable_buf(istr, true); + auto check_for_null = [&null_representation, &settings](ReadBuffer & buf_) { + auto & buf = assert_cast(buf_); buf.setCheckpoint(); SCOPE_EXIT(buf.dropCheckpoint()); if (checkString(null_representation, buf)) @@ -572,13 +718,18 @@ ReturnType SerializationNullable::deserializeTextCSVImpl(IColumn & column, ReadB return false; }; - auto deserialize_nested = [&nested_serialization, &settings, &buf, &null_representation, &istr] (IColumn & nested_column) + auto deserialize_nested_with_check = [&deserialize_nested, &nested_serialization, &settings, &null_representation, &istr] (IColumn & nested_column, ReadBuffer & buf_) { + auto & buf = assert_cast(buf_); auto * pos = buf.position(); - nested_serialization->deserializeTextCSV(nested_column, buf, settings); + if constexpr (throw_exception) + deserialize_nested(nested_column, buf); + else if (!deserialize_nested(nested_column, buf)) + return ReturnType(false); + /// Check that we don't have any unread data in PeekableReadBuffer own memory. if (likely(!buf.hasUnreadData())) - return; + return ReturnType(true); /// We have some unread data in PeekableReadBuffer own memory. /// It can happen only if there is an unquoted string instead of a number @@ -587,6 +738,9 @@ ReturnType SerializationNullable::deserializeTextCSVImpl(IColumn & column, ReadB /// We also should delete incorrectly deserialized value from nested column. 
nested_column.popBack(1); + if constexpr (!throw_exception) + return ReturnType(false); + if (null_representation.find(settings.csv.delimiter) != std::string::npos || null_representation.find('\r') != std::string::npos || null_representation.find('\n') != std::string::npos) throw DB::ParsingException(ErrorCodes::CANNOT_READ_ALL_DATA, "CSV custom null representation containing " @@ -602,7 +756,35 @@ ReturnType SerializationNullable::deserializeTextCSVImpl(IColumn & column, ReadB istr.count(), std::string(pos, buf.position() - pos), parsed_value.str()); }; - return safeDeserialize(column, *nested_serialization, check_for_null, deserialize_nested); + return deserializeImpl(column, peekable_buf, check_for_null, deserialize_nested_with_check, is_null); +} + +void SerializationNullable::deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + ColumnNullable & col = assert_cast(column); + bool is_null; + deserializeTextCSVImpl(col.getNestedColumn(), istr, settings, nested, is_null); + safeAppendToNullMap(col, is_null); +} + +bool SerializationNullable::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + ColumnNullable & col = assert_cast(column); + bool is_null; + return deserializeTextCSVImpl(col.getNestedColumn(), istr, settings, nested, is_null) && safeAppendToNullMap(col, is_null); +} + +bool SerializationNullable::deserializeNullAsDefaultOrNestedTextCSV(DB::IColumn & nested_column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, const DB::SerializationPtr & nested_serialization) +{ + bool is_null; + deserializeTextCSVImpl(nested_column, istr, settings, nested_serialization, is_null); + return !is_null; +} + +bool SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextCSV(DB::IColumn & nested_column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, const DB::SerializationPtr & nested_serialization) +{ + bool is_null; + return deserializeTextCSVImpl(nested_column, istr, settings, nested_serialization, is_null); } void SerializationNullable::serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const @@ -616,38 +798,86 @@ void SerializationNullable::serializeText(const IColumn & column, size_t row_num /// This assumes UTF-8 and proper font support. This is Ok, because Pretty formats are "presentational", not for data exchange. 
if (col.isNullAt(row_num)) - { - if (settings.pretty.charset == FormatSettings::Pretty::Charset::UTF8) - writeCString("ᴺᵁᴸᴸ", ostr); - else - writeCString("NULL", ostr); - } + serializeNullText(ostr, settings); else nested->serializeText(col.getNestedColumn(), row_num, ostr, settings); } +void SerializationNullable::serializeNullText(DB::WriteBuffer & ostr, const DB::FormatSettings & settings) +{ + if (settings.pretty.charset == FormatSettings::Pretty::Charset::UTF8) + writeCString("ᴺᵁᴸᴸ", ostr); + else + writeCString("NULL", ostr); +} + +bool SerializationNullable::tryDeserializeNullText(DB::ReadBuffer & istr) +{ + if (checkCharCaseInsensitive('N', istr)) + return checkStringCaseInsensitive("ULL", istr); + return checkStringCaseInsensitive("ᴺᵁᴸᴸ", istr); +} + void SerializationNullable::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { const ColumnNullable & col = assert_cast(column); if (col.isNullAt(row_num)) - writeCString("null", ostr); + serializeNullJSON(ostr); else nested->serializeTextJSON(col.getNestedColumn(), row_num, ostr, settings); } -void SerializationNullable::deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +void SerializationNullable::serializeNullJSON(DB::WriteBuffer & ostr) { - deserializeTextJSONImpl(column, istr, settings, nested); + writeCString("null", ostr); +} + +bool SerializationNullable::tryDeserializeNullJSON(DB::ReadBuffer & istr) +{ + return checkString("null", istr); } template -ReturnType SerializationNullable::deserializeTextJSONImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, - const SerializationPtr & nested) +ReturnType deserializeTextJSONImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested, bool & is_null) { - return safeDeserialize(column, *nested, - [&istr] { return checkStringByFirstCharacterAndAssertTheRest("null", istr); }, - [&nested, &istr, &settings] (IColumn & nested_column) { nested->deserializeTextJSON(nested_column, istr, settings); }); + auto check_for_null = [](ReadBuffer & buf){ return checkStringByFirstCharacterAndAssertTheRest("null", buf); }; + auto deserialize_nested = [&nested, &settings](IColumn & nested_column, ReadBuffer & buf) + { + if constexpr (std::is_same_v) + return nested->tryDeserializeTextJSON(nested_column, buf, settings); + nested->deserializeTextJSON(nested_column, buf, settings); + }; + + return deserializeImpl(column, istr, check_for_null, deserialize_nested, is_null); +} + +void SerializationNullable::deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + ColumnNullable & col = assert_cast(column); + bool is_null; + deserializeTextJSONImpl(col.getNestedColumn(), istr, settings, nested, is_null); + safeAppendToNullMap(col, is_null); +} + +bool SerializationNullable::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + ColumnNullable & col = assert_cast(column); + bool is_null; + return deserializeTextJSONImpl(col.getNestedColumn(), istr, settings, nested, is_null) && safeAppendToNullMap(col, is_null); +} + +bool SerializationNullable::deserializeNullAsDefaultOrNestedTextJSON(DB::IColumn & nested_column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, const DB::SerializationPtr & nested_serialization) +{ + bool is_null; + deserializeTextJSONImpl(nested_column, istr, settings, nested_serialization, is_null); + return 
!is_null; +} + +bool SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextJSON(DB::IColumn & nested_column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, const DB::SerializationPtr & nested_serialization) +{ + bool is_null; + return deserializeTextJSONImpl(nested_column, istr, settings, nested_serialization, is_null); } void SerializationNullable::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const @@ -660,11 +890,9 @@ void SerializationNullable::serializeTextXML(const IColumn & column, size_t row_ nested->serializeTextXML(col.getNestedColumn(), row_num, ostr, settings); } -template bool SerializationNullable::deserializeWholeTextImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested); -template bool SerializationNullable::deserializeTextEscapedImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested); -template bool SerializationNullable::deserializeTextQuotedImpl(IColumn & column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested); -template bool SerializationNullable::deserializeTextCSVImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested); -template bool SerializationNullable::deserializeTextJSONImpl(IColumn & column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested); -template bool SerializationNullable::deserializeTextRawImpl(IColumn & column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested); +void SerializationNullable::serializeNullXML(DB::WriteBuffer & ostr) +{ + writeCString("\\N", ostr); +} } diff --git a/src/DataTypes/Serializations/SerializationNullable.h b/src/DataTypes/Serializations/SerializationNullable.h index 3ec01b46de5..37858ccdefd 100644 --- a/src/DataTypes/Serializations/SerializationNullable.h +++ b/src/DataTypes/Serializations/SerializationNullable.h @@ -51,9 +51,12 @@ public: void deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; @@ -66,31 +69,49 @@ public: * In CSV, non-NULL string value, starting with \N characters, must be placed in quotes, to avoid ambiguity. 
*/ void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; - /// If ReturnType is bool, check for NULL and deserialize value into non-nullable column (and return true) or insert default value of nested type (and return false) - /// If ReturnType is void, deserialize Nullable(T) - template - static ReturnType deserializeWholeTextImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested); - template - static ReturnType deserializeTextEscapedImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested); - template - static ReturnType deserializeTextQuotedImpl(IColumn & column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested); - template - static ReturnType deserializeTextCSVImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested); - template - static ReturnType deserializeTextJSONImpl(IColumn & column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested); - template - static ReturnType deserializeTextRawImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested); - template - static ReturnType deserializeTextEscapedAndRawImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested); + /// Check for NULL and deserialize value into non-nullable column (and return true) or insert default value of nested type (and return false) + static bool deserializeNullAsDefaultOrNestedWholeText(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization); + static bool deserializeNullAsDefaultOrNestedTextEscaped(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization); + static bool deserializeNullAsDefaultOrNestedTextQuoted(IColumn & nested_column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested_serialization); + static bool deserializeNullAsDefaultOrNestedTextCSV(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization); + static bool deserializeNullAsDefaultOrNestedTextJSON(IColumn & nested_column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested_serialization); + static bool
deserializeNullAsDefaultOrNestedTextRaw(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization); + + /// Check for NULL and deserialize value into non-nullable column or insert default value of nested type. + /// Return true if parsing was successful and false in case of any error. + static bool tryDeserializeNullAsDefaultOrNestedWholeText(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization); + static bool tryDeserializeNullAsDefaultOrNestedTextEscaped(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization); + static bool tryDeserializeNullAsDefaultOrNestedTextQuoted(IColumn & nested_column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested_serialization); + static bool tryDeserializeNullAsDefaultOrNestedTextCSV(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization); + static bool tryDeserializeNullAsDefaultOrNestedTextJSON(IColumn & nested_column, ReadBuffer & istr, const FormatSettings &, const SerializationPtr & nested_serialization); + static bool tryDeserializeNullAsDefaultOrNestedTextRaw(IColumn & nested_column, ReadBuffer & istr, const FormatSettings & settings, const SerializationPtr & nested_serialization); + + + static void serializeNullEscaped(WriteBuffer & ostr, const FormatSettings & settings); + static bool tryDeserializeNullEscaped(ReadBuffer & istr, const FormatSettings & settings); + static void serializeNullQuoted(WriteBuffer & ostr); + static bool tryDeserializeNullQuoted(ReadBuffer & istr); + static void serializeNullCSV(WriteBuffer & ostr, const FormatSettings & settings); + static bool tryDeserializeNullCSV(ReadBuffer & istr, const FormatSettings & settings); + static void serializeNullJSON(WriteBuffer & ostr); + static bool tryDeserializeNullJSON(ReadBuffer & istr); + static void serializeNullRaw(WriteBuffer & ostr, const FormatSettings & settings); + static bool tryDeserializeNullRaw(ReadBuffer & istr, const FormatSettings & settings); + static void serializeNullText(WriteBuffer & ostr, const FormatSettings & settings); + static bool tryDeserializeNullText(ReadBuffer & istr); + static void serializeNullXML(WriteBuffer & ostr); private: struct SubcolumnCreator : public ISubcolumnCreator diff --git a/src/DataTypes/Serializations/SerializationNumber.cpp b/src/DataTypes/Serializations/SerializationNumber.cpp index b6c7e4618b8..bdb4dfc6735 100644 --- a/src/DataTypes/Serializations/SerializationNumber.cpp +++ b/src/DataTypes/Serializations/SerializationNumber.cpp @@ -37,6 +37,18 @@ void SerializationNumber::deserializeText(IColumn & column, ReadBuffer & istr throwUnexpectedDataAfterParsedValue(column, istr, settings, "Number"); } +template +bool SerializationNumber::tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const +{ + T x; + + if (!tryReadText(x, istr) || (whole && !istr.eof())) + return false; + + assert_cast &>(column).getData().push_back(x); + return true; +} + template void SerializationNumber::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { @@ -44,9 +56,10 @@ void SerializationNumber::serializeTextJSON(const IColumn & column, size_t ro writeJSONNumber(x, ostr, settings); } -template -void SerializationNumber::deserializeTextJSON(IColumn & column,
ReadBuffer & istr, const FormatSettings & settings) const +template +ReturnType deserializeTextJSONImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) { + static constexpr bool throw_exception = std::is_same_v; bool has_quote = false; if (!istr.eof() && *istr.position() == '"') /// We understand the number both in quotes and without. { @@ -54,13 +67,16 @@ void SerializationNumber::deserializeTextJSON(IColumn & column, ReadBuffer & ++istr.position(); } - FieldType x; + T x; /// null if (!has_quote && !istr.eof() && *istr.position() == 'n') { ++istr.position(); - assertString("ull", istr); + if constexpr (throw_exception) + assertString("ull", istr); + else if (!checkString("ull", istr)) + return ReturnType(false); x = NaNOrZero(); } @@ -73,26 +89,62 @@ void SerializationNumber::deserializeTextJSON(IColumn & column, ReadBuffer & { // extra conditions to parse true/false strings into 1/0 if (istr.eof()) - throwReadAfterEOF(); + { + if constexpr (throw_exception) + throwReadAfterEOF(); + else + return false; + } + if (*istr.position() == 't' || *istr.position() == 'f') { bool tmp = false; - readBoolTextWord(tmp, istr); + if constexpr (throw_exception) + readBoolTextWord(tmp, istr); + else if (!readBoolTextWord(tmp, istr)) + return ReturnType(false); + x = tmp; } else - readText(x, istr); + { + if constexpr (throw_exception) + readText(x, istr); + else if (!tryReadText(x, istr)) + return ReturnType(false); + } } else { - readText(x, istr); + if constexpr (throw_exception) + readText(x, istr); + else if (!tryReadText(x, istr)) + return ReturnType(false); } if (has_quote) - assertChar('"', istr); + { + if constexpr (throw_exception) + assertChar('"', istr); + else if (!checkChar('"', istr)) + return ReturnType(false); + } } assert_cast &>(column).getData().push_back(x); + return ReturnType(true); +} + +template +void SerializationNumber::deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + deserializeTextJSONImpl(column, istr, settings); +} + +template +bool SerializationNumber::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return deserializeTextJSONImpl(column, istr, settings); } template @@ -103,6 +155,16 @@ void SerializationNumber::deserializeTextCSV(IColumn & column, ReadBuffer & i assert_cast &>(column).getData().push_back(x); } +template +bool SerializationNumber::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & /*settings*/) const +{ + FieldType x; + if (!tryReadCSV(x, istr)) + return false; + assert_cast &>(column).getData().push_back(x); + return true; +} + template void SerializationNumber::serializeBinary(const Field & field, WriteBuffer & ostr, const FormatSettings &) const { diff --git a/src/DataTypes/Serializations/SerializationNumber.h b/src/DataTypes/Serializations/SerializationNumber.h index 972c6c9a30f..9d53dc9c494 100644 --- a/src/DataTypes/Serializations/SerializationNumber.h +++ b/src/DataTypes/Serializations/SerializationNumber.h @@ -20,9 +20,12 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override; + bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & 
settings) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; /** Format is platform-dependent. */ void serializeBinary(const Field & field, WriteBuffer & ostr, const FormatSettings &) const override; diff --git a/src/DataTypes/Serializations/SerializationString.cpp b/src/DataTypes/Serializations/SerializationString.cpp index 788ff429088..1680ec8a333 100644 --- a/src/DataTypes/Serializations/SerializationString.cpp +++ b/src/DataTypes/Serializations/SerializationString.cpp @@ -272,40 +272,67 @@ void SerializationString::serializeTextEscaped(const IColumn & column, size_t ro } -template -static inline void read(IColumn & column, Reader && reader) +template +static inline ReturnType read(IColumn & column, Reader && reader) { + static constexpr bool throw_exception = std::is_same_v; ColumnString & column_string = assert_cast(column); ColumnString::Chars & data = column_string.getChars(); ColumnString::Offsets & offsets = column_string.getOffsets(); size_t old_chars_size = data.size(); size_t old_offsets_size = offsets.size(); - try - { - reader(data); - data.push_back(0); - offsets.push_back(data.size()); - } - catch (...) + auto restore_column = [&]() { offsets.resize_assume_reserved(old_offsets_size); data.resize_assume_reserved(old_chars_size); - throw; + }; + + try + { + if constexpr (throw_exception) + { + reader(data); + } + else if (!reader(data)) + { + restore_column(); + return false; + } + + data.push_back(0); + offsets.push_back(data.size()); + return ReturnType(true); + } + catch (...) 
+ { + restore_column(); + if constexpr (throw_exception) + throw; + else + return false; } } void SerializationString::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { - read(column, [&](ColumnString::Chars & data) { readStringUntilEOFInto(data, istr); }); + read(column, [&](ColumnString::Chars & data) { readStringUntilEOFInto(data, istr); }); } +bool SerializationString::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + return read(column, [&](ColumnString::Chars & data) { readStringUntilEOFInto(data, istr); return true; }); +} void SerializationString::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { - read(column, [&](ColumnString::Chars & data) { readEscapedStringInto(data, istr); }); + read(column, [&](ColumnString::Chars & data) { readEscapedStringInto(data, istr); }); } +bool SerializationString::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + return read(column, [&](ColumnString::Chars & data) { readEscapedStringInto(data, istr); return true; }); +} void SerializationString::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const { @@ -315,7 +342,12 @@ void SerializationString::serializeTextQuoted(const IColumn & column, size_t row void SerializationString::deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { - read(column, [&](ColumnString::Chars & data) { readQuotedStringInto(data, istr); }); + read(column, [&](ColumnString::Chars & data) { readQuotedStringInto(data, istr); }); +} + +bool SerializationString::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + return read(column, [&](ColumnString::Chars & data) { return tryReadQuotedStringInto(data, istr); }); } @@ -329,11 +361,11 @@ void SerializationString::deserializeTextJSON(IColumn & column, ReadBuffer & ist { if (settings.json.read_objects_as_strings && !istr.eof() && *istr.position() == '{') { - read(column, [&](ColumnString::Chars & data) { readJSONObjectPossiblyInvalid(data, istr); }); + read(column, [&](ColumnString::Chars & data) { readJSONObjectPossiblyInvalid(data, istr); }); } else if (settings.json.read_arrays_as_strings && !istr.eof() && *istr.position() == '[') { - read(column, [&](ColumnString::Chars & data) { readJSONArrayInto(data, istr); }); + read(column, [&](ColumnString::Chars & data) { readJSONArrayInto(data, istr); }); } else if (settings.json.read_numbers_as_strings && !istr.eof() && *istr.position() != '"') { @@ -342,12 +374,40 @@ void SerializationString::deserializeTextJSON(IColumn & column, ReadBuffer & ist Float64 tmp; ReadBufferFromString buf(field); if (tryReadFloatText(tmp, buf) && buf.eof()) - read(column, [&](ColumnString::Chars & data) { data.insert(field.begin(), field.end()); }); + read(column, [&](ColumnString::Chars & data) { data.insert(field.begin(), field.end()); }); else throw Exception(ErrorCodes::INCORRECT_DATA, "Cannot parse JSON String value here: {}", field); } else - read(column, [&](ColumnString::Chars & data) { readJSONStringInto(data, istr); }); + read(column, [&](ColumnString::Chars & data) { readJSONStringInto(data, istr); }); +} + +bool SerializationString::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + if (settings.json.read_objects_as_strings && !istr.eof() && *istr.position() == '{') + return 
read(column, [&](ColumnString::Chars & data) { return readJSONObjectPossiblyInvalid(data, istr); }); + + if (settings.json.read_arrays_as_strings && !istr.eof() && *istr.position() == '[') + return read(column, [&](ColumnString::Chars & data) { return readJSONArrayInto(data, istr); }); + + if (settings.json.read_numbers_as_strings && !istr.eof() && *istr.position() != '"') + { + String field; + if (!tryReadJSONField(field, istr)) + return false; + + Float64 tmp; + ReadBufferFromString buf(field); + if (tryReadFloatText(tmp, buf) && buf.eof()) + { + read(column, [&](ColumnString::Chars & data) { data.insert(field.begin(), field.end()); }); + return true; + } + + return false; + } + + return read(column, [&](ColumnString::Chars & data) { return tryReadJSONStringInto(data, istr); }); } @@ -365,7 +425,12 @@ void SerializationString::serializeTextCSV(const IColumn & column, size_t row_nu void SerializationString::deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { - read(column, [&](ColumnString::Chars & data) { readCSVStringInto(data, istr, settings.csv); }); + read(column, [&](ColumnString::Chars & data) { readCSVStringInto(data, istr, settings.csv); }); +} + +bool SerializationString::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return read(column, [&](ColumnString::Chars & data) { readCSVStringInto(data, istr, settings.csv); return true; }); } void SerializationString::serializeTextMarkdown( diff --git a/src/DataTypes/Serializations/SerializationString.h b/src/DataTypes/Serializations/SerializationString.h index cd4cdf79c11..89ab84f0d22 100644 --- a/src/DataTypes/Serializations/SerializationString.h +++ b/src/DataTypes/Serializations/SerializationString.h @@ -18,20 +18,25 @@ public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextCSV(IColumn & column, 
ReadBuffer & istr, const FormatSettings &) const override; void serializeTextMarkdown(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; }; diff --git a/src/DataTypes/Serializations/SerializationTuple.cpp b/src/DataTypes/Serializations/SerializationTuple.cpp index cbbe97eb05c..c0b0658e6b4 100644 --- a/src/DataTypes/Serializations/SerializationTuple.cpp +++ b/src/DataTypes/Serializations/SerializationTuple.cpp @@ -62,15 +62,35 @@ void SerializationTuple::serializeBinary(const IColumn & column, size_t row_num, } -template -static void addElementSafe(size_t num_elems, IColumn & column, F && impl) +template +static ReturnType addElementSafe(size_t num_elems, IColumn & column, F && impl) { + static constexpr bool throw_exception = std::is_same_v; + /// We use the assumption that tuples of zero size do not exist. size_t old_size = column.size(); + auto restore_elements = [&]() + { + for (size_t i = 0; i < num_elems; ++i) + { + auto & element_column = extractElementColumn(column, i); + if (element_column.size() > old_size) + element_column.popBack(1); + } + }; + try { - impl(); + if constexpr (throw_exception) + { + impl(); + } + else if (!impl()) + { + restore_elements(); + return ReturnType(false); + } // Check that all columns now have the same size. size_t new_size = column.size(); @@ -81,22 +101,23 @@ static void addElementSafe(size_t num_elems, IColumn & column, F && impl) { // This is not a logical error because it may work with // user-supplied data. - throw Exception(ErrorCodes::SIZES_OF_COLUMNS_IN_TUPLE_DOESNT_MATCH, - "Cannot read a tuple because not all elements are present"); + if constexpr (throw_exception) + throw Exception(ErrorCodes::SIZES_OF_COLUMNS_IN_TUPLE_DOESNT_MATCH, + "Cannot read a tuple because not all elements are present"); + restore_elements(); + return ReturnType(false); } } } catch (...) 
{ - for (size_t i = 0; i < num_elems; ++i) - { - auto & element_column = extractElementColumn(column, i); - if (element_column.size() > old_size) - element_column.popBack(1); - } - - throw; + restore_elements(); + if constexpr (throw_exception) + throw; + return ReturnType(false); } + + return ReturnType(true); } void SerializationTuple::deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const @@ -120,25 +141,51 @@ void SerializationTuple::serializeText(const IColumn & column, size_t row_num, W writeChar(')', ostr); } -void SerializationTuple::deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const +template +ReturnType SerializationTuple::deserializeTextImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const { - const size_t size = elems.size(); - assertChar('(', istr); + static constexpr bool throw_exception = std::is_same_v; - addElementSafe(elems.size(), column, [&] + const size_t size = elems.size(); + if constexpr (throw_exception) + assertChar('(', istr); + else if (!checkChar('(', istr)) + return ReturnType(false); + + auto impl = [&]() { for (size_t i = 0; i < size; ++i) { skipWhitespaceIfAny(istr); if (i != 0) { - assertChar(',', istr); + if constexpr (throw_exception) + assertChar(',', istr); + else if (!checkChar(',', istr)) + return ReturnType(false); + skipWhitespaceIfAny(istr); } - if (settings.null_as_default) - SerializationNullable::deserializeTextQuotedImpl(extractElementColumn(column, i), istr, settings, elems[i]); + + auto & element_column = extractElementColumn(column, i); + if constexpr (throw_exception) + { + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(element_column)) + SerializationNullable::deserializeNullAsDefaultOrNestedTextQuoted(element_column, istr, settings, elems[i]); + else + elems[i]->deserializeTextQuoted(element_column, istr, settings); + } else - elems[i]->deserializeTextQuoted(extractElementColumn(column, i), istr, settings); + { + bool ok; + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(element_column)) + ok = SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextQuoted(element_column, istr, settings, elems[i]); + else + ok = elems[i]->tryDeserializeTextQuoted(element_column, istr, settings); + + if (!ok) + return false; + } } // Special format for one element tuple (1,) @@ -150,11 +197,35 @@ void SerializationTuple::deserializeText(IColumn & column, ReadBuffer & istr, co } skipWhitespaceIfAny(istr); - assertChar(')', istr); + if constexpr (throw_exception) + assertChar(')', istr); + else if (!checkChar(')', istr)) + return ReturnType(false); if (whole && !istr.eof()) - throwUnexpectedDataAfterParsedValue(column, istr, settings, "Tuple"); - }); + { + if constexpr (throw_exception) + throwUnexpectedDataAfterParsedValue(column, istr, settings, "Tuple"); + return ReturnType(false); + } + + return ReturnType(true); + }; + + if constexpr (throw_exception) + addElementSafe(elems.size(), column, impl); + else + return addElementSafe(elems.size(), column, impl); +} + +void SerializationTuple::deserializeText(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, bool whole) const +{ + deserializeTextImpl(column, istr, settings, whole); +} + +bool SerializationTuple::tryDeserializeText(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, bool whole) const +{ + return deserializeTextImpl(column, istr, settings, whole); 
} void SerializationTuple::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const @@ -239,16 +310,39 @@ void SerializationTuple::serializeTextJSONPretty(const IColumn & column, size_t } } -void SerializationTuple::deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +template +ReturnType SerializationTuple::deserializeTextJSONImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const { + static constexpr bool throw_exception = std::is_same_v; + + auto deserialize_element = [&](IColumn & element_column, size_t element_pos) + { + if constexpr (throw_exception) + { + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(element_column)) + SerializationNullable::deserializeNullAsDefaultOrNestedTextJSON(element_column, istr, settings, elems[element_pos]); + else + elems[element_pos]->deserializeTextJSON(element_column, istr, settings); + } + else + { + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(element_column)) + return SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextJSON(element_column, istr, settings, elems[element_pos]); + return elems[element_pos]->tryDeserializeTextJSON(element_column, istr, settings); + } + }; + if (settings.json.read_named_tuples_as_objects && have_explicit_names) { skipWhitespaceIfAny(istr); - assertChar('{', istr); + if constexpr (throw_exception) + assertChar('{', istr); + else if (!checkChar('{', istr)) + return ReturnType(false); skipWhitespaceIfAny(istr); - addElementSafe(elems.size(), column, [&] + auto impl = [&]() { std::vector seen_elements(elems.size(), 0); size_t processed = 0; @@ -256,18 +350,32 @@ void SerializationTuple::deserializeTextJSON(IColumn & column, ReadBuffer & istr while (!istr.eof() && *istr.position() != '}') { if (!settings.json.ignore_unknown_keys_in_named_tuple && processed == elems.size()) - throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected number of elements in named tuple. Expected no more than {} (consider enabling input_format_json_ignore_unknown_keys_in_named_tuple setting)", elems.size()); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected number of elements in named tuple. 
Expected no more than {} (consider enabling input_format_json_ignore_unknown_keys_in_named_tuple setting)", elems.size()); + return ReturnType(false); + } if (processed + skipped > 0) { - assertChar(',', istr); + if constexpr (throw_exception) + assertChar(',', istr); + else if (!checkChar(',', istr)) + return ReturnType(false); skipWhitespaceIfAny(istr); } std::string name; - readDoubleQuotedString(name, istr); + if constexpr (throw_exception) + readDoubleQuotedString(name, istr); + else if (!tryReadDoubleQuotedString(name, istr)) + return ReturnType(false); + skipWhitespaceIfAny(istr); - assertChar(':', istr); + if constexpr (throw_exception) + assertChar(':', istr); + else if (!checkChar(':', istr)) + return ReturnType(false); skipWhitespaceIfAny(istr); const size_t element_pos = getPositionByName(name); @@ -275,36 +383,52 @@ void SerializationTuple::deserializeTextJSON(IColumn & column, ReadBuffer & istr { if (settings.json.ignore_unknown_keys_in_named_tuple) { - skipJSONField(istr, name); + if constexpr (throw_exception) + skipJSONField(istr, name); + else if (!trySkipJSONField(istr, name)) + return ReturnType(false); + skipWhitespaceIfAny(istr); ++skipped; continue; } else - throw Exception(ErrorCodes::NOT_FOUND_COLUMN_IN_BLOCK, "Tuple doesn't have element with name '{}', enable setting input_format_json_ignore_unknown_keys_in_named_tuple", name); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::NOT_FOUND_COLUMN_IN_BLOCK, "Tuple doesn't have element with name '{}', enable setting input_format_json_ignore_unknown_keys_in_named_tuple", name); + return ReturnType(false); + } } seen_elements[element_pos] = 1; auto & element_column = extractElementColumn(column, element_pos); - try + if constexpr (throw_exception) { - if (settings.null_as_default) - SerializationNullable::deserializeTextJSONImpl(element_column, istr, settings, elems[element_pos]); - else - elems[element_pos]->deserializeTextJSON(element_column, istr, settings); + try + { + deserialize_element(element_column, element_pos); + } + catch (Exception & e) + { + e.addMessage("(while reading the value of nested key " + name + ")"); + throw; + } } - catch (Exception & e) + else { - e.addMessage("(while reading the value of nested key " + name + ")"); - throw; + if (!deserialize_element(element_column, element_pos)) + return ReturnType(false); } skipWhitespaceIfAny(istr); ++processed; } - assertChar('}', istr); + if constexpr (throw_exception) + assertChar('}', istr); + else if (!checkChar('}', istr)) + return ReturnType(false); /// Check if we have missing elements. if (processed != elems.size()) @@ -315,41 +439,87 @@ void SerializationTuple::deserializeTextJSON(IColumn & column, ReadBuffer & istr continue; if (!settings.json.defaults_for_missing_elements_in_named_tuple) - throw Exception( - ErrorCodes::INCORRECT_DATA, - "JSON object doesn't contain tuple element {}. If you want to insert defaults in case of missing elements, " - "enable setting input_format_json_defaults_for_missing_elements_in_named_tuple", - elems[element_pos]->getElementName()); + { + if constexpr (throw_exception) + throw Exception( + ErrorCodes::INCORRECT_DATA, + "JSON object doesn't contain tuple element {}. 
If you want to insert defaults in case of missing elements, " + "enable setting input_format_json_defaults_for_missing_elements_in_named_tuple", + elems[element_pos]->getElementName()); + return ReturnType(false); + } auto & element_column = extractElementColumn(column, element_pos); element_column.insertDefault(); } } - }); + + return ReturnType(true); + }; + + if constexpr (throw_exception) + addElementSafe(elems.size(), column, impl); + else + return addElementSafe(elems.size(), column, impl); } else { - assertChar('[', istr); + skipWhitespaceIfAny(istr); + if constexpr (throw_exception) + assertChar('[', istr); + else if (!checkChar('[', istr)) + return ReturnType(false); + skipWhitespaceIfAny(istr); - addElementSafe(elems.size(), column, [&] + auto impl = [&]() { for (size_t i = 0; i < elems.size(); ++i) { skipWhitespaceIfAny(istr); if (i != 0) { - assertChar(',', istr); + if constexpr (throw_exception) + assertChar(',', istr); + else if (!checkChar(',', istr)) + return ReturnType(false); skipWhitespaceIfAny(istr); } - elems[i]->deserializeTextJSON(extractElementColumn(column, i), istr, settings); + + auto & element_column = extractElementColumn(column, i); + + if constexpr (throw_exception) + deserialize_element(element_column, i); + else if (!deserialize_element(element_column, i)) + return ReturnType(false); } skipWhitespaceIfAny(istr); - assertChar(']', istr); - }); + if constexpr (throw_exception) + assertChar(']', istr); + else if (!checkChar(']', istr)) + return ReturnType(false); + + return ReturnType(true); + }; + + if constexpr (throw_exception) + addElementSafe(elems.size(), column, impl); + else + return addElementSafe(elems.size(), column, impl); } } +void SerializationTuple::deserializeTextJSON(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const +{ + deserializeTextJSONImpl(column, istr, settings); +} + +bool SerializationTuple::tryDeserializeTextJSON(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const +{ + return deserializeTextJSONImpl(column, istr, settings); +} + + void SerializationTuple::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeCString("", ostr); @@ -385,14 +555,48 @@ void SerializationTuple::deserializeTextCSV(IColumn & column, ReadBuffer & istr, assertChar(settings.csv.tuple_delimiter, istr); skipWhitespaceIfAny(istr); } - if (settings.null_as_default) - SerializationNullable::deserializeTextCSVImpl(extractElementColumn(column, i), istr, settings, elems[i]); + + auto & element_column = extractElementColumn(column, i); + if (settings.null_as_default && !isColumnNullableOrLowCardinalityNullable(element_column)) + SerializationNullable::deserializeNullAsDefaultOrNestedTextCSV(element_column, istr, settings, elems[i]); else - elems[i]->deserializeTextCSV(extractElementColumn(column, i), istr, settings); + elems[i]->deserializeTextCSV(element_column, istr, settings); } }); } +bool SerializationTuple::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return addElementSafe(elems.size(), column, [&] + { + const size_t size = elems.size(); + for (size_t i = 0; i < size; ++i) + { + if (i != 0) + { + skipWhitespaceIfAny(istr); + if (!checkChar(settings.csv.tuple_delimiter, istr)) + return false; + skipWhitespaceIfAny(istr); + } + + auto & element_column = extractElementColumn(column, i); + if (settings.null_as_default && 
!isColumnNullableOrLowCardinalityNullable(element_column)) + { + if (!SerializationNullable::tryDeserializeNullAsDefaultOrNestedTextCSV(element_column, istr, settings, elems[i])) + return false; + } + else + { + if (!elems[i]->tryDeserializeTextCSV(element_column, istr, settings)) + return false; + } + } + + return true; + }); +} + void SerializationTuple::enumerateStreams( EnumerateStreamsSettings & settings, const StreamCallback & callback, diff --git a/src/DataTypes/Serializations/SerializationTuple.h b/src/DataTypes/Serializations/SerializationTuple.h index 7325259f440..d9c63a05217 100644 --- a/src/DataTypes/Serializations/SerializationTuple.h +++ b/src/DataTypes/Serializations/SerializationTuple.h @@ -23,14 +23,17 @@ public: void deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const override; + bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSONPretty(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings, size_t indent) const override; void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; /// Tuples in CSV format will be serialized as separate columns (that is, losing their nesting in the tuple). void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; /** Each sub-column in a tuple is serialized in separate stream. 
*/ @@ -73,6 +76,15 @@ private: bool have_explicit_names; size_t getPositionByName(const String & name) const; + + template + ReturnType deserializeTextImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const; + + template + ReturnType deserializeTextJSONImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const; + + template + ReturnType deserializeTextCSVImpl(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const; }; } diff --git a/src/DataTypes/Serializations/SerializationUUID.cpp b/src/DataTypes/Serializations/SerializationUUID.cpp index 5cf17b4c0c8..5a7aeca67a0 100644 --- a/src/DataTypes/Serializations/SerializationUUID.cpp +++ b/src/DataTypes/Serializations/SerializationUUID.cpp @@ -25,15 +25,16 @@ void SerializationUUID::deserializeText(IColumn & column, ReadBuffer & istr, con throwUnexpectedDataAfterParsedValue(column, istr, settings, "UUID"); } -void SerializationUUID::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +bool SerializationUUID::tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const { - deserializeText(column, istr, settings, false); + UUID x; + if (!tryReadText(x, istr) || (whole && !istr.eof())) + return false; + + assert_cast(column).getData().push_back(x); + return true; } -void SerializationUUID::serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const -{ - serializeText(column, row_num, ostr, settings); -} void SerializationUUID::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { @@ -76,6 +77,17 @@ void SerializationUUID::deserializeTextQuoted(IColumn & column, ReadBuffer & ist assert_cast(column).getData().push_back(std::move(uuid)); /// It's important to do this at the end - for exception safety. 
} +bool SerializationUUID::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + UUID uuid; + String field; + if (!checkChar('\'', istr) || !tryReadText(uuid, istr) || !checkChar('\'', istr)) + return false; + + assert_cast(column).getData().push_back(std::move(uuid)); + return true; +} + void SerializationUUID::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -92,6 +104,15 @@ void SerializationUUID::deserializeTextJSON(IColumn & column, ReadBuffer & istr, assert_cast(column).getData().push_back(x); } +bool SerializationUUID::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + UUID x; + if (!checkChar('"', istr) || !tryReadText(x, istr) || !checkChar('"', istr)) + return false; + assert_cast(column).getData().push_back(x); + return true; +} + void SerializationUUID::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { writeChar('"', ostr); @@ -106,6 +127,14 @@ void SerializationUUID::deserializeTextCSV(IColumn & column, ReadBuffer & istr, assert_cast(column).getData().push_back(value); } +bool SerializationUUID::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const +{ + UUID value; + if (!tryReadCSV(value, istr)) + return false; + assert_cast(column).getData().push_back(value); + return true; +} void SerializationUUID::serializeBinary(const Field & field, WriteBuffer & ostr, const FormatSettings &) const { diff --git a/src/DataTypes/Serializations/SerializationUUID.h b/src/DataTypes/Serializations/SerializationUUID.h index da8c15f7279..458504f8f42 100644 --- a/src/DataTypes/Serializations/SerializationUUID.h +++ b/src/DataTypes/Serializations/SerializationUUID.h @@ -10,14 +10,16 @@ class SerializationUUID : public SimpleTextSerialization public: void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override; - void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; - void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) 
const override; void serializeBinary(const Field & field, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeBinary(Field & field, ReadBuffer & istr, const FormatSettings &) const override; diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp new file mode 100644 index 00000000000..ebd44fd6955 --- /dev/null +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -0,0 +1,828 @@ +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +#include +#include +#include +#include +#include + +namespace DB +{ + +namespace ErrorCodes +{ + extern const int LOGICAL_ERROR; + extern const int NOT_IMPLEMENTED; + extern const int INCORRECT_DATA; +} + +void SerializationVariant::enumerateStreams( + EnumerateStreamsSettings & settings, + const StreamCallback & callback, + const SubstreamData & data) const +{ + const auto * type_variant = data.type ? &assert_cast(*data.type) : nullptr; + const auto * column_variant = data.column ? &assert_cast(*data.column) : nullptr; + + auto discriminators_serialization = std::make_shared(std::make_shared>(), "discr", false); + auto local_discriminators = column_variant ? column_variant->getLocalDiscriminatorsPtr() : nullptr; + + settings.path.push_back(Substream::VariantDiscriminators); + auto discriminators_data = SubstreamData(discriminators_serialization) + .withType(type_variant ? std::make_shared>() : nullptr) + .withColumn(column_variant ? column_variant->getLocalDiscriminatorsPtr() : nullptr) + .withSerializationInfo(data.serialization_info); + + settings.path.back().data = discriminators_data; + callback(settings.path); + settings.path.pop_back(); + + settings.path.push_back(Substream::VariantElements); + settings.path.back().data = data; + + for (size_t i = 0; i < variants.size(); ++i) + { + settings.path.back().creator = std::make_shared(local_discriminators, variant_names[i], i, column_variant ? column_variant->localDiscriminatorByGlobal(i) : i); + + auto variant_data = SubstreamData(variants[i]) + .withType(type_variant ? type_variant->getVariant(i) : nullptr) + .withColumn(column_variant ? 
column_variant->getVariantPtrByGlobalDiscriminator(i) : nullptr) + .withSerializationInfo(data.serialization_info); + + addVariantElementToPath(settings.path, i); + settings.path.back().data = variant_data; + variants[i]->enumerateStreams(settings, callback, variant_data); + settings.path.pop_back(); + } + + settings.path.pop_back(); +} + +struct SerializeBinaryBulkStateVariant : public ISerialization::SerializeBinaryBulkState +{ + std::vector states; +}; + +struct DeserializeBinaryBulkStateVariant : public ISerialization::DeserializeBinaryBulkState +{ + std::vector states; +}; + +void SerializationVariant::serializeBinaryBulkStatePrefix( + const IColumn & column, + SerializeBinaryBulkSettings & settings, + SerializeBinaryBulkStatePtr & state) const +{ + const ColumnVariant & col = assert_cast(column); + + auto variant_state = std::make_shared(); + variant_state->states.resize(variants.size()); + + settings.path.push_back(Substream::VariantElements); + + for (size_t i = 0; i < variants.size(); ++i) + { + addVariantElementToPath(settings.path, i); + variants[i]->serializeBinaryBulkStatePrefix(col.getVariantByGlobalDiscriminator(i), settings, variant_state->states[i]); + settings.path.pop_back(); + } + + settings.path.pop_back(); + state = std::move(variant_state); +} + + +void SerializationVariant::serializeBinaryBulkStateSuffix( + SerializeBinaryBulkSettings & settings, + SerializeBinaryBulkStatePtr & state) const +{ + auto * variant_state = checkAndGetState(state); + + settings.path.push_back(Substream::VariantElements); + for (size_t i = 0; i < variants.size(); ++i) + { + addVariantElementToPath(settings.path, i); + variants[i]->serializeBinaryBulkStateSuffix(settings, variant_state->states[i]); + settings.path.pop_back(); + } + settings.path.pop_back(); +} + + +void SerializationVariant::deserializeBinaryBulkStatePrefix( + DeserializeBinaryBulkSettings & settings, + DeserializeBinaryBulkStatePtr & state) const +{ + auto variant_state = std::make_shared(); + variant_state->states.resize(variants.size()); + + settings.path.push_back(Substream::VariantElements); + for (size_t i = 0; i < variants.size(); ++i) + { + addVariantElementToPath(settings.path, i); + variants[i]->deserializeBinaryBulkStatePrefix(settings, variant_state->states[i]); + settings.path.pop_back(); + } + + settings.path.pop_back(); + state = std::move(variant_state); +} + + +void SerializationVariant::serializeBinaryBulkWithMultipleStreams( + const IColumn & column, + size_t offset, + size_t limit, + SerializeBinaryBulkSettings & settings, + SerializeBinaryBulkStatePtr & state) const +{ + const ColumnVariant & col = assert_cast(column); + if (const size_t size = col.size(); limit == 0 || offset + limit > size) + limit = size - offset; + + settings.path.push_back(Substream::VariantDiscriminators); + auto * discriminators_stream = settings.getter(settings.path); + settings.path.pop_back(); + + if (!discriminators_stream) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Got empty stream for VariantDiscriminators in SerializationVariant::serializeBinaryBulkWithMultipleStreams"); + + auto * variant_state = checkAndGetState(state); + + /// If offset = 0 and limit == col.size() or we have only NULLs, we don't need to calculate + /// offsets and limits for variants and need to just serialize whole columns. + if ((offset == 0 && limit == col.size()) || col.hasOnlyNulls()) + { + /// First, serialize discriminators. + /// If we have only NULLs or local and global discriminators are the same, just serialize the column as is. 
+ if (col.hasOnlyNulls() || col.hasGlobalVariantsOrder()) + { + SerializationNumber().serializeBinaryBulk(col.getLocalDiscriminatorsColumn(), *discriminators_stream, offset, limit); + } + /// If local and global discriminators are different, we should convert local to global before serializing (because we don't serialize the mapping). + else + { + const auto & local_discriminators = col.getLocalDiscriminators(); + for (size_t i = offset; i != offset + limit; ++i) + writeBinaryLittleEndian(col.globalDiscriminatorByLocal(local_discriminators[i]), *discriminators_stream); + } + + /// Second, serialize variants in global order. + settings.path.push_back(Substream::VariantElements); + for (size_t i = 0; i != variants.size(); ++i) + { + addVariantElementToPath(settings.path, i); + variants[i]->serializeBinaryBulkWithMultipleStreams(col.getVariantByGlobalDiscriminator(i), 0, 0, settings, variant_state->states[i]); + settings.path.pop_back(); + } + settings.path.pop_back(); + return; + } + + /// If we have only one non empty variant and no NULLs, we can use the same limit offset for this variant. + if (auto non_empty_local_discr = col.getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + /// First, serialize discriminators. + /// We know that all discriminators are the same, so we just need to serialize this discriminator limit times. + auto non_empty_global_discr = col.globalDiscriminatorByLocal(*non_empty_local_discr); + for (size_t i = 0; i != limit; ++i) + writeBinaryLittleEndian(non_empty_global_discr, *discriminators_stream); + + /// Second, serialize variants in global order. + settings.path.push_back(Substream::VariantElements); + for (size_t i = 0; i != variants.size(); ++i) + { + addVariantElementToPath(settings.path, i); + /// For non empty variant use the same offset/limit as for whole Variant column + if (i == non_empty_global_discr) + variants[i]->serializeBinaryBulkWithMultipleStreams(col.getVariantByGlobalDiscriminator(i), offset, limit, settings, variant_state->states[i]); + /// For empty variants, use just 0/0, they won't serialize anything. + else + variants[i]->serializeBinaryBulkWithMultipleStreams(col.getVariantByGlobalDiscriminator(i), 0, 0, settings, variant_state->states[i]); + settings.path.pop_back(); + } + settings.path.pop_back(); + return; + } + + /// In general case we should iterate through local discriminators in range [offset, offset + limit] to serialize global discriminators and calculate offset/limit pair for each variant. + const auto & local_discriminators = col.getLocalDiscriminators(); + const auto & offsets = col.getOffsets(); + std::vector> variant_offsets_and_limits(variants.size(), {0, 0}); + size_t end = offset + limit; + for (size_t i = offset; i < end; ++i) + { + auto global_discr = col.globalDiscriminatorByLocal(local_discriminators[i]); + writeBinaryLittleEndian(global_discr, *discriminators_stream); + + if (global_discr != ColumnVariant::NULL_DISCRIMINATOR) + { + /// If we see this discriminator for the first time, update offset + if (!variant_offsets_and_limits[global_discr].second) + variant_offsets_and_limits[global_discr].first = offsets[i]; + /// Update limit for this discriminator. + ++variant_offsets_and_limits[global_discr].second; + } + } + + /// If limit for some variant is 0, it means that we don't have its discriminator in the range. + /// Set offset to the size of column for such variants, so we won't serialize values from them. 
+ for (size_t i = 0; i != variant_offsets_and_limits.size(); ++i) + { + if (!variant_offsets_and_limits[i].second) + variant_offsets_and_limits[i].first = col.getVariantByGlobalDiscriminator(i).size(); + } + + /// Serialize variants in global order. + settings.path.push_back(Substream::VariantElements); + for (size_t i = 0; i != variants.size(); ++i) + { + addVariantElementToPath(settings.path, i); + variants[i]->serializeBinaryBulkWithMultipleStreams( + col.getVariantByGlobalDiscriminator(i), + variant_offsets_and_limits[i].first, + variant_offsets_and_limits[i].second, + settings, + variant_state->states[i]); + settings.path.pop_back(); + } + settings.path.pop_back(); +} + + +void SerializationVariant::deserializeBinaryBulkWithMultipleStreams( + ColumnPtr & column, + size_t limit, + DeserializeBinaryBulkSettings & settings, + DeserializeBinaryBulkStatePtr & state, + SubstreamsCache * cache) const +{ + auto mutable_column = column->assumeMutable(); + ColumnVariant & col = assert_cast(*mutable_column); + /// We always serialize Variant column with global variants order, + /// so while deserialization column should be always with global variants order. + if (!col.hasGlobalVariantsOrder()) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Trying to deserialize data into Variant column with not global variants order"); + + /// First, deserialize new discriminators. + /// We deserialize them into a separate column to be able to use substream cache, + /// so if we also need to deserialize some of sub columns, we will read discriminators only once. + settings.path.push_back(Substream::VariantDiscriminators); + ColumnPtr discriminators; + if (auto cached_discriminators = getFromSubstreamsCache(cache, settings.path)) + { + discriminators = cached_discriminators; + } + else + { + auto * discriminators_stream = settings.getter(settings.path); + if (!discriminators_stream) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Got empty stream for VariantDiscriminators in SerializationVariant::deserializeBinaryBulkWithMultipleStreams"); + + discriminators = ColumnVariant::ColumnDiscriminators::create(); + SerializationNumber().deserializeBinaryBulk(*discriminators->assumeMutable(), *discriminators_stream, limit, 0); + addToSubstreamsCache(cache, settings.path, discriminators); + } + + settings.path.pop_back(); + + /// Iterate through new discriminators, append them to column and calculate the limit for each variant. + /// While calculating limits we can also fill offsets column (we store offsets only in memory). + const auto & discriminators_data = assert_cast(*discriminators).getData(); + auto & local_discriminators = col.getLocalDiscriminators(); + local_discriminators.reserve(local_discriminators.size() + limit); + auto & offsets = col.getOffsets(); + offsets.reserve(offsets.size() + limit); + std::vector variant_limits(variants.size(), 0); + for (size_t i = 0; i != limit; ++i) + { + ColumnVariant::Discriminator discr = discriminators_data[i]; + local_discriminators.push_back(discr); + if (discr == ColumnVariant::NULL_DISCRIMINATOR) + offsets.emplace_back(); + else + offsets.push_back(col.getVariantByLocalDiscriminator(discr).size() + variant_limits[discr]++); + } + + /// Now we can deserialize variants according to their limits. 
+ auto * variant_state = checkAndGetState(state); + settings.path.push_back(Substream::VariantElements); + for (size_t i = 0; i != variants.size(); ++i) + { + addVariantElementToPath(settings.path, i); + variants[i]->deserializeBinaryBulkWithMultipleStreams(col.getVariantPtrByLocalDiscriminator(i), variant_limits[i], settings, variant_state->states[i], cache); + settings.path.pop_back(); + } + settings.path.pop_back(); +} + +void SerializationVariant::addVariantElementToPath(DB::ISerialization::SubstreamPath & path, size_t i) const +{ + path.push_back(Substream::VariantElement); + path.back().variant_element_name = variant_names[i]; +} + +void SerializationVariant::serializeBinary(const Field & /*field*/, WriteBuffer & /*ostr*/, const FormatSettings & /*settings*/) const +{ + throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method serializeBinary from a field is not implemented for SerializationVariant"); +} + +void SerializationVariant::deserializeBinary(Field & /*field*/, ReadBuffer & /*istr*/, const FormatSettings & /*settings*/) const +{ + throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method deserializeBinary to a field is not implemented for SerializationVariant"); +} + +void SerializationVariant::serializeBinary(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const +{ + const ColumnVariant & col = assert_cast(column); + auto global_discr = col.globalDiscriminatorAt(row_num); + writeBinaryLittleEndian(global_discr, ostr); + if (global_discr != ColumnVariant::NULL_DISCRIMINATOR) + variants[global_discr]->serializeBinary(col.getVariantByGlobalDiscriminator(global_discr), col.offsetAt(row_num), ostr, settings); +} + +void SerializationVariant::deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + ColumnVariant & col = assert_cast(column); + ColumnVariant::Discriminator global_discr; + readBinaryLittleEndian(global_discr, istr); + if (global_discr == ColumnVariant::NULL_DISCRIMINATOR) + { + col.insertDefault(); + } + else + { + auto & variant_column = col.getVariantByGlobalDiscriminator(global_discr); + variants[global_discr]->deserializeBinary(variant_column, istr, settings); + col.getLocalDiscriminators().push_back(col.localDiscriminatorByGlobal(global_discr)); + col.getOffsets().push_back(variant_column.size() - 1); + } +} + +namespace +{ + +std::unordered_map getTypesTextDeserializePriorityMap() +{ + static const std::vector priorities = { + /// Complex types have highest priority. + TypeIndex::Array, + TypeIndex::Tuple, + TypeIndex::Map, + TypeIndex::AggregateFunction, + + /// Enums can be parsed both from strings and numbers. + /// So they have high enough priority. + TypeIndex::Enum8, + TypeIndex::Enum16, + + /// Types that can be parsed from strings. + TypeIndex::UUID, + TypeIndex::IPv4, + TypeIndex::IPv6, + + /// Types that can be parsed from numbers. + /// The order: + /// 1) Integers + /// 2) Big Integers + /// 3) Decimals + /// 4) Floats + /// In each group small types have higher priority. + TypeIndex::Int8, + TypeIndex::UInt8, + TypeIndex::Int16, + TypeIndex::UInt16, + TypeIndex::Int32, + TypeIndex::UInt32, + TypeIndex::Int64, + TypeIndex::UInt64, + TypeIndex::Int128, + TypeIndex::UInt128, + TypeIndex::Int256, + TypeIndex::UInt256, + TypeIndex::Decimal32, + TypeIndex::Decimal64, + TypeIndex::Decimal128, + TypeIndex::Decimal256, + TypeIndex::Float32, + TypeIndex::Float64, + + /// Dates and DateTimes. More simple Date types have higher priority. 
+ /// They have lower priority as numbers as some DateTimes sometimes can + /// be also parsed from numbers, but we don't want it usually. + TypeIndex::Date, + TypeIndex::Date32, + TypeIndex::DateTime, + TypeIndex::DateTime64, + + /// String types have almost the lowest priority, + /// as in text formats almost all data can + /// be deserialized into String type. + TypeIndex::FixedString, + TypeIndex::String, + }; + + std::unordered_map priority_map; + priority_map.reserve(priorities.size()); + for (size_t i = 0; i != priorities.size(); ++i) + priority_map[priorities[i]] = priorities.size() - i; + return priority_map; +} + +/// We want to create more or less optimal order of types in which we will try text deserializations. +/// To do it, for each type we calculate a priority and then sort them by this priority. +/// Above we defined priority of each data type, but types can be nested and also we can have LowCardinality and Nullable. +/// To sort any nested types we create a priority that is a tuple of 3 elements: +/// 1) The maximum depth of nested types like Array/Map/Tuple. +/// 2) The combination of simple and complex types priorities. +/// 3) The depth of nested types LowCardinality/Nullable. +/// So, when we will sort types, first we will sort by the maximum depth of nested types, so more nested types are deserialized first, +/// then for types with the same depth we sort by the types priority, and last we sort by the depth of LowCardinality/Nullable types, +/// so if we have types with the same level of nesting and the same priority, we will first try to deserialize LowCardinality/Nullable types +/// (for example if we have types Array(Array(String)) and Array(Array(Nullable(String))). +/// This is just a batch of heuristics, +std::tuple getTypeTextDeserializePriority(const DataTypePtr & type, size_t nested_depth, size_t simple_nested_depth, std::unordered_map & priority_map) +{ + if (const auto * nullable_type = typeid_cast(type.get())) + return getTypeTextDeserializePriority(nullable_type->getNestedType(), nested_depth, simple_nested_depth + 1, priority_map); + + if (const auto * lc_type = typeid_cast(type.get())) + return getTypeTextDeserializePriority(lc_type->getDictionaryType(), nested_depth, simple_nested_depth + 1, priority_map); + + if (const auto * array_type = typeid_cast(type.get())) + { + auto [elements_nested_depth, elements_priority, elements_simple_nested_depth] = getTypeTextDeserializePriority(array_type->getNestedType(), nested_depth + 1, simple_nested_depth, priority_map); + return {elements_nested_depth, elements_priority + priority_map[TypeIndex::Array], elements_simple_nested_depth}; + } + + if (const auto * tuple_type = typeid_cast(type.get())) + { + size_t max_nested_depth = 0; + size_t sum_priority = 0; + size_t max_simple_nested_depth = 0; + for (const auto & elem : tuple_type->getElements()) + { + auto [elem_nested_depth, elem_priority, elem_simple_nested_depth] = getTypeTextDeserializePriority(elem, nested_depth + 1, simple_nested_depth, priority_map); + sum_priority += elem_priority; + if (elem_nested_depth > max_nested_depth) + max_nested_depth = elem_nested_depth; + if (elem_simple_nested_depth > max_simple_nested_depth) + max_simple_nested_depth = elem_simple_nested_depth; + } + + return {max_nested_depth, sum_priority + priority_map[TypeIndex::Tuple], max_simple_nested_depth}; + } + + if (const auto * map_type = typeid_cast(type.get())) + { + auto [key_max_depth, key_priority, key_simple_nested_depth] = 
getTypeTextDeserializePriority(map_type->getKeyType(), nested_depth + 1, simple_nested_depth, priority_map); + auto [value_max_depth, value_priority, value_simple_nested_depth] = getTypeTextDeserializePriority(map_type->getValueType(), nested_depth + 1, simple_nested_depth, priority_map); + return {std::max(key_max_depth, value_max_depth), key_priority + value_priority + priority_map[TypeIndex::Map], std::max(key_simple_nested_depth, value_simple_nested_depth)}; + } + + if (const auto * variant_type = typeid_cast(type.get())) + { + size_t max_priority = 0; + size_t max_depth = 0; + size_t max_simple_nested_depth = 0; + for (const auto & variant : variant_type->getVariants()) + { + auto [variant_max_depth, variant_priority, variant_simple_nested_depth] = getTypeTextDeserializePriority(variant, nested_depth, simple_nested_depth, priority_map); + if (variant_priority > max_priority) + max_priority = variant_priority; + if (variant_max_depth > max_depth) + max_depth = variant_max_depth; + if (variant_simple_nested_depth > max_simple_nested_depth) + max_simple_nested_depth = variant_simple_nested_depth; + } + + return {max_depth, max_priority, max_simple_nested_depth}; + } + + return {nested_depth, priority_map[type->getTypeId()], simple_nested_depth}; +} + +} + +std::vector SerializationVariant::getVariantsDeserializeTextOrder(const DB::DataTypes & variant_types) +{ + std::vector> priorities; + priorities.reserve(variant_types.size()); + std::vector order; + order.reserve(variant_types.size()); + auto priority_map = getTypesTextDeserializePriorityMap(); + for (size_t i = 0; i != variant_types.size(); ++i) + { + priorities.push_back(getTypeTextDeserializePriority(variant_types[i], 0, 0, priority_map)); + order.push_back(i); + } + + std::sort(order.begin(), order.end(), [&](size_t left, size_t right) { return priorities[left] > priorities[right]; }); + String types_order; + for (auto i : order) + types_order += " " + variant_types[i]->getName(); + return order; +} + + +bool SerializationVariant::tryDeserializeImpl( + IColumn & column, + const String & field, + std::function check_for_null, + std::function try_deserialize_variant) const +{ + auto & column_variant = assert_cast(column); + ReadBufferFromString null_buf(field); + if (check_for_null(null_buf) && null_buf.eof()) + { + column_variant.insertDefault(); + return true; + } + + for (size_t global_discr : deserialize_text_order) + { + ReadBufferFromString variant_buf(field); + /// Usually try_deserialize_variant should not throw an exception, but let's use try/catch just in case. + try + { + auto & variant_column = column_variant.getVariantByGlobalDiscriminator(global_discr); + size_t prev_size = variant_column.size(); + if (try_deserialize_variant(variant_column, variants[global_discr], variant_buf) && variant_buf.eof()) + { + column_variant.getLocalDiscriminators().push_back(column_variant.localDiscriminatorByGlobal(global_discr)); + column_variant.getOffsets().push_back(prev_size); + return true; + } + else if (variant_column.size() > prev_size) + { + variant_column.popBack(1); + } + } + catch (...) + { + /// Try next variant. 
+ } + } + + return false; +} + +void SerializationVariant::serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const +{ + const ColumnVariant & col = assert_cast(column); + auto global_discr = col.globalDiscriminatorAt(row_num); + if (global_discr == ColumnVariant::NULL_DISCRIMINATOR) + SerializationNullable::serializeNullEscaped(ostr, settings); + else + variants[global_discr]->serializeTextEscaped(col.getVariantByGlobalDiscriminator(global_discr), col.offsetAt(row_num), ostr, settings); +} + +bool SerializationVariant::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readEscapedString(field, istr); + return tryDeserializeTextEscapedImpl(column, field, settings); +} + +void SerializationVariant::deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readEscapedString(field, istr); + if (!tryDeserializeTextEscapedImpl(column, field, settings)) + throw Exception(ErrorCodes::INCORRECT_DATA, "Cannot parse escaped value of type {} here: {}", variant_name, field); +} + +bool SerializationVariant::tryDeserializeTextEscapedImpl(DB::IColumn & column, const String & field, const DB::FormatSettings & settings) const +{ + auto check_for_null = [&](ReadBuffer & buf) + { + return SerializationNullable::tryDeserializeNullEscaped(buf, settings); + }; + auto try_deserialize_variant =[&](IColumn & variant_column, const SerializationPtr & variant_serialization, ReadBuffer & buf) + { + return variant_serialization->tryDeserializeTextEscaped(variant_column, buf, settings); + }; + + return tryDeserializeImpl(column, field, check_for_null, try_deserialize_variant); +} + +void SerializationVariant::serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const +{ + const ColumnVariant & col = assert_cast(column); + auto global_discr = col.globalDiscriminatorAt(row_num); + if (global_discr == ColumnVariant::NULL_DISCRIMINATOR) + SerializationNullable::serializeNullRaw(ostr, settings); + else + variants[global_discr]->serializeTextRaw(col.getVariantByGlobalDiscriminator(global_discr), col.offsetAt(row_num), ostr, settings); +} + +bool SerializationVariant::tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readString(field, istr); + return tryDeserializeTextRawImpl(column, field, settings); +} + +void SerializationVariant::deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readString(field, istr); + if (!tryDeserializeTextRawImpl(column, field, settings)) + throw Exception(ErrorCodes::INCORRECT_DATA, "Cannot parse raw value of type {} here: {}", variant_name, field); +} + +bool SerializationVariant::tryDeserializeTextRawImpl(DB::IColumn & column, const String & field, const DB::FormatSettings & settings) const +{ + auto check_for_null = [&](ReadBuffer & buf) + { + return SerializationNullable::tryDeserializeNullRaw(buf, settings); + }; + auto try_deserialize_variant =[&](IColumn & variant_column, const SerializationPtr & variant_serialization, ReadBuffer & buf) + { + return variant_serialization->tryDeserializeTextRaw(variant_column, buf, settings); + }; + + return tryDeserializeImpl(column, field, check_for_null, try_deserialize_variant); +} + +void SerializationVariant::serializeTextQuoted(const IColumn & column, size_t row_num, 
WriteBuffer & ostr, const FormatSettings & settings) const +{ + const ColumnVariant & col = assert_cast(column); + auto global_discr = col.globalDiscriminatorAt(row_num); + if (global_discr == ColumnVariant::NULL_DISCRIMINATOR) + SerializationNullable::serializeNullQuoted(ostr); + else + variants[global_discr]->serializeTextQuoted(col.getVariantByGlobalDiscriminator(global_discr), col.offsetAt(row_num), ostr, settings); +} + +bool SerializationVariant::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + if (!tryReadQuotedField(field, istr)) + return false; + return tryDeserializeTextQuotedImpl(column, field, settings); +} + +void SerializationVariant::deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readQuotedField(field, istr); + if (!tryDeserializeTextQuotedImpl(column, field, settings)) + throw Exception(ErrorCodes::INCORRECT_DATA, "Cannot parse quoted value of type {} here: {}", variant_name, field); +} + +bool SerializationVariant::tryDeserializeTextQuotedImpl(DB::IColumn & column, const String & field, const DB::FormatSettings & settings) const +{ + auto check_for_null = [&](ReadBuffer & buf) + { + return SerializationNullable::tryDeserializeNullQuoted(buf); + }; + auto try_deserialize_variant =[&](IColumn & variant_column, const SerializationPtr & variant_serialization, ReadBuffer & buf) + { + return variant_serialization->tryDeserializeTextQuoted(variant_column, buf, settings); + }; + + return tryDeserializeImpl(column, field, check_for_null, try_deserialize_variant); +} + +void SerializationVariant::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const +{ + const ColumnVariant & col = assert_cast(column); + auto global_discr = col.globalDiscriminatorAt(row_num); + if (global_discr == ColumnVariant::NULL_DISCRIMINATOR) + SerializationNullable::serializeNullCSV(ostr, settings); + else + variants[global_discr]->serializeTextCSV(col.getVariantByGlobalDiscriminator(global_discr), col.offsetAt(row_num), ostr, settings); +} + +bool SerializationVariant::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readCSVStringInto(field, istr, settings.csv); + return tryDeserializeTextCSVImpl(column, field, settings); +} + +void SerializationVariant::deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readCSVField(field, istr, settings.csv); + if (!tryDeserializeTextCSVImpl(column, field, settings)) + throw Exception(ErrorCodes::INCORRECT_DATA, "Cannot parse CSV value of type {} here: {}", variant_name, field); +} + +bool SerializationVariant::tryDeserializeTextCSVImpl(DB::IColumn & column, const String & field, const DB::FormatSettings & settings) const +{ + auto check_for_null = [&](ReadBuffer & buf) + { + return SerializationNullable::tryDeserializeNullCSV(buf, settings); + }; + auto try_deserialize_variant =[&](IColumn & variant_column, const SerializationPtr & variant_serialization, ReadBuffer & buf) + { + return variant_serialization->tryDeserializeTextCSV(variant_column, buf, settings); + }; + + return tryDeserializeImpl(column, field, check_for_null, try_deserialize_variant); +} + +void SerializationVariant::serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const +{ + const ColumnVariant & col = 
assert_cast(column); + auto global_discr = col.globalDiscriminatorAt(row_num); + if (global_discr == ColumnVariant::NULL_DISCRIMINATOR) + SerializationNullable::serializeNullText(ostr, settings); + else + variants[global_discr]->serializeText(col.getVariantByGlobalDiscriminator(global_discr), col.offsetAt(row_num), ostr, settings); +} + +bool SerializationVariant::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readStringUntilEOF(field, istr); + return tryDeserializeWholeTextImpl(column, field, settings); +} + +void SerializationVariant::deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readStringUntilEOF(field, istr); + if (!tryDeserializeWholeTextImpl(column, field, settings)) + throw Exception(ErrorCodes::INCORRECT_DATA, "Cannot parse text value of type {} here: {}", variant_name, field); +} + +bool SerializationVariant::tryDeserializeWholeTextImpl(DB::IColumn & column, const String & field, const DB::FormatSettings & settings) const +{ + auto check_for_null = [&](ReadBuffer & buf) + { + return SerializationNullable::tryDeserializeNullText(buf); + }; + auto try_deserialize_variant =[&](IColumn & variant_column, const SerializationPtr & variant_serialization, ReadBuffer & buf) + { + return variant_serialization->tryDeserializeWholeText(variant_column, buf, settings); + }; + + return tryDeserializeImpl(column, field, check_for_null, try_deserialize_variant); +} + +void SerializationVariant::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const +{ + const ColumnVariant & col = assert_cast(column); + auto global_discr = col.globalDiscriminatorAt(row_num); + if (global_discr == ColumnVariant::NULL_DISCRIMINATOR) + SerializationNullable::serializeNullJSON(ostr); + else + variants[global_discr]->serializeTextJSON(col.getVariantByGlobalDiscriminator(global_discr), col.offsetAt(row_num), ostr, settings); +} + +bool SerializationVariant::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + if (!tryReadJSONField(field, istr)) + return false; + return tryDeserializeTextJSONImpl(column, field, settings); +} + +void SerializationVariant::deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + String field; + readJSONField(field, istr); + if (!tryDeserializeTextJSONImpl(column, field, settings)) + throw Exception(ErrorCodes::INCORRECT_DATA, "Cannot parse JSON value of type {} here: {}", variant_name, field); +} + +bool SerializationVariant::tryDeserializeTextJSONImpl(DB::IColumn & column, const String & field, const DB::FormatSettings & settings) const +{ + auto check_for_null = [&](ReadBuffer & buf) + { + return SerializationNullable::tryDeserializeNullJSON(buf); + }; + auto try_deserialize_variant =[&](IColumn & variant_column, const SerializationPtr & variant_serialization, ReadBuffer & buf) + { + return variant_serialization->tryDeserializeTextJSON(variant_column, buf, settings); + }; + + return tryDeserializeImpl(column, field, check_for_null, try_deserialize_variant); +} + +void SerializationVariant::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const +{ + const ColumnVariant & col = assert_cast(column); + auto global_discr = col.globalDiscriminatorAt(row_num); + if (global_discr == ColumnVariant::NULL_DISCRIMINATOR) + 
SerializationNullable::serializeNullXML(ostr); + else + variants[global_discr]->serializeTextXML(col.getVariantByGlobalDiscriminator(global_discr), col.offsetAt(row_num), ostr, settings); +} + +} diff --git a/src/DataTypes/Serializations/SerializationVariant.h b/src/DataTypes/Serializations/SerializationVariant.h new file mode 100644 index 00000000000..b6bee94c65f --- /dev/null +++ b/src/DataTypes/Serializations/SerializationVariant.h @@ -0,0 +1,116 @@ +#pragma once + +#include +#include + +namespace DB +{ + +class SerializationVariant : public ISerialization +{ +public: + using VariantSerializations = std::vector; + + explicit SerializationVariant( + const VariantSerializations & variants_, + const std::vector & variant_names_, + const std::vector & deserialize_text_order_, + const String & variant_name_) + : variants(variants_), variant_names(variant_names_), deserialize_text_order(deserialize_text_order_), variant_name(variant_name_) + { + } + + void enumerateStreams( + EnumerateStreamsSettings & settings, + const StreamCallback & callback, + const SubstreamData & data) const override; + + void serializeBinaryBulkStatePrefix( + const IColumn & column, + SerializeBinaryBulkSettings & settings, + SerializeBinaryBulkStatePtr & state) const override; + + void serializeBinaryBulkStateSuffix( + SerializeBinaryBulkSettings & settings, + SerializeBinaryBulkStatePtr & state) const override; + + void deserializeBinaryBulkStatePrefix( + DeserializeBinaryBulkSettings & settings, + DeserializeBinaryBulkStatePtr & state) const override; + + void serializeBinaryBulkWithMultipleStreams( + const IColumn & column, + size_t offset, + size_t limit, + SerializeBinaryBulkSettings & settings, + SerializeBinaryBulkStatePtr & state) const override; + + void deserializeBinaryBulkWithMultipleStreams( + ColumnPtr & column, + size_t limit, + DeserializeBinaryBulkSettings & settings, + DeserializeBinaryBulkStatePtr & state, + SubstreamsCache * cache) const override; + + void serializeBinary(const Field & field, WriteBuffer & ostr, const FormatSettings & settings) const override; + void deserializeBinary(Field & field, ReadBuffer & istr, const FormatSettings & settings) const override; + + void serializeBinary(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; + void deserializeBinary(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + + void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; + void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + + void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; + void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + + void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; + void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + + 
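Note: all per-format serializers above (escaped, raw, quoted, CSV, plain text, JSON, XML) share one dispatch pattern: look up the row's global discriminator, emit the format's NULL representation for NULL_DISCRIMINATOR, and otherwise delegate to the active variant's serialization at the row's offset inside that variant. A condensed, self-contained model of that dispatch; VariantRowRef and the writer callables are placeholders, not real ClickHouse types:

#include <cstddef>
#include <cstdint>
#include <functional>
#include <ostream>
#include <vector>

constexpr uint8_t NULL_DISCRIMINATOR = 255;

struct VariantRowRef
{
    uint8_t global_discriminator;  // which variant holds this row, or NULL_DISCRIMINATOR
    size_t offset;                 // row index inside that variant's own column
};

using VariantWriter = std::function<void(std::ostream &, size_t /*offset*/)>;

void serializeRow(
    std::ostream & out,
    const VariantRowRef & row,
    const std::vector<VariantWriter> & writers_by_global_discriminator,
    const std::function<void(std::ostream &)> & write_null)
{
    if (row.global_discriminator == NULL_DISCRIMINATOR)
        write_null(out);  // e.g. "\N" for escaped/raw, "NULL" for quoted, "null" for JSON
    else
        writers_by_global_discriminator[row.global_discriminator](out, row.offset);
}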
void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; + void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + + void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; + void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + + void serializeTextRaw(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; + void deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + bool tryDeserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override; + + void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; + + /// Determine the order in which we should try to deserialize variants. + /// In some cases the text representation of a value can be deserialized + /// into several types (for example, almost all text values can be deserialized + /// into String type), so we uses some heuristics to determine the more optimal order. + static std::vector getVariantsDeserializeTextOrder(const DataTypes & variant_types); + +private: + void addVariantElementToPath(SubstreamPath & path, size_t i) const; + + bool tryDeserializeTextEscapedImpl(IColumn & column, const String & field, const FormatSettings & settings) const; + bool tryDeserializeTextQuotedImpl(IColumn & column, const String & field, const FormatSettings & settings) const; + bool tryDeserializeWholeTextImpl(IColumn & column, const String & field, const FormatSettings & settings) const; + bool tryDeserializeTextCSVImpl(IColumn & column, const String & field, const FormatSettings & settings) const; + bool tryDeserializeTextJSONImpl(IColumn & column, const String & field, const FormatSettings & settings) const; + bool tryDeserializeTextRawImpl(IColumn & column, const String & field, const FormatSettings & settings) const; + + bool tryDeserializeImpl( + IColumn & column, + const String & field, + std::function check_for_null, + std::function try_deserialize_nested) const; + + VariantSerializations variants; + std::vector variant_names; + std::vector deserialize_text_order; + /// Name of Variant data type for better exception messages. + String variant_name; +}; + +} diff --git a/src/DataTypes/Serializations/SerializationVariantElement.cpp b/src/DataTypes/Serializations/SerializationVariantElement.cpp new file mode 100644 index 00000000000..4b24ee5754e --- /dev/null +++ b/src/DataTypes/Serializations/SerializationVariantElement.cpp @@ -0,0 +1,241 @@ +#include +#include +#include +#include + +namespace DB +{ + +namespace ErrorCodes +{ + extern const int NOT_IMPLEMENTED; + extern const int LOGICAL_ERROR; +} + +void SerializationVariantElement::enumerateStreams( + DB::ISerialization::EnumerateStreamsSettings & settings, + const DB::ISerialization::StreamCallback & callback, + const DB::ISerialization::SubstreamData & data) const +{ + /// We will need stream for discriminators during deserialization. 
+ settings.path.push_back(Substream::VariantDiscriminators); + callback(settings.path); + settings.path.pop_back(); + + addVariantToPath(settings.path); + settings.path.back().data = data; + nested_serialization->enumerateStreams(settings, callback, data); + removeVariantFromPath(settings.path); +} + +void SerializationVariantElement::serializeBinaryBulkStatePrefix(const IColumn &, SerializeBinaryBulkSettings &, SerializeBinaryBulkStatePtr &) const +{ + throw Exception( + ErrorCodes::NOT_IMPLEMENTED, "Method serializeBinaryBulkStatePrefix is not implemented for SerializationVariantElement"); +} + +void SerializationVariantElement::serializeBinaryBulkStateSuffix(SerializeBinaryBulkSettings &, SerializeBinaryBulkStatePtr &) const +{ + throw Exception( + ErrorCodes::NOT_IMPLEMENTED, "Method serializeBinaryBulkStateSuffix is not implemented for SerializationVariantElement"); +} + +void SerializationVariantElement::deserializeBinaryBulkStatePrefix(DeserializeBinaryBulkSettings & settings, DeserializeBinaryBulkStatePtr & state) const +{ + addVariantToPath(settings.path); + nested_serialization->deserializeBinaryBulkStatePrefix(settings, state); + removeVariantFromPath(settings.path); +} + +void SerializationVariantElement::serializeBinaryBulkWithMultipleStreams(const IColumn &, size_t, size_t, SerializeBinaryBulkSettings &, SerializeBinaryBulkStatePtr &) const +{ + throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method serializeBinaryBulkWithMultipleStreams is not implemented for SerializationVariantElement"); +} + +void SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams( + ColumnPtr & column, + size_t limit, + DeserializeBinaryBulkSettings & settings, + DeserializeBinaryBulkStatePtr & state, + SubstreamsCache * cache) const +{ + auto mutable_column = column->assumeMutable(); + ColumnNullable * nullable_col = typeid_cast(mutable_column.get()); + NullMap * null_map = nullable_col ? &nullable_col->getNullMapData() : nullptr; + + /// First, deserialize discriminators from Variant column. + settings.path.push_back(Substream::VariantDiscriminators); + ColumnPtr discriminators; + if (auto cached_discriminators = getFromSubstreamsCache(cache, settings.path)) + { + discriminators = cached_discriminators; + } + else + { + auto * discriminators_stream = settings.getter(settings.path); + if (!discriminators_stream) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Got empty stream for VariantDiscriminators in SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams"); + + discriminators = ColumnVariant::ColumnDiscriminators::create(); + SerializationNumber().deserializeBinaryBulk(*discriminators->assumeMutable(), *discriminators_stream, limit, 0); + addToSubstreamsCache(cache, settings.path, discriminators); + } + settings.path.pop_back(); + + /// Iterate through discriminators to calculate the size of the variant. + const auto & discriminators_data = assert_cast(*discriminators).getData(); + size_t variant_size = 0; + for (auto discr : discriminators_data) + variant_size += discr == variant_discriminator; + + /// Now we know the size of the variant and can deserialize it. + + /// If the size of variant column is the same as the size of discriminators, + /// we can deserialize new values directly into our column. + if (variant_size == discriminators_data.size()) + { + addVariantToPath(settings.path); + /// Special case when our result column is LowCardinality(Nullable(T)). 
+ /// In this case the variant type is LowCardinality(T), and we cannot just + /// deserialize its values directly into LowCardinality(Nullable(T)) column. + /// We create a separate column with type LowCardinality(T), deserialize + /// values into it and then insert into result column using insertRangeFrom. + if (isColumnLowCardinalityNullable(*column)) + { + ColumnPtr variant_col = mutable_column->cloneEmpty(); + /// LowCardinality(Nullable(T)) -> LowCardinality(T) + assert_cast(*variant_col->assumeMutable()).nestedRemoveNullable(); + nested_serialization->deserializeBinaryBulkWithMultipleStreams(variant_col, limit, settings, state, cache); + mutable_column->insertRangeFrom(*variant_col, 0, variant_col->size()); + } + else + { + nested_serialization->deserializeBinaryBulkWithMultipleStreams(nullable_col ? nullable_col->getNestedColumnPtr() : column, limit, settings, state, cache); + } + if (nullable_col) + null_map->resize_fill(null_map->size() + limit, 0); + removeVariantFromPath(settings.path); + return; + } + + /// If variant size is 0, just fill column with default values. + if (variant_size == 0) + { + mutable_column->insertManyDefaults(limit); + return; + } + + /// In general case we should deserialize variant into a separate column, + /// iterate through discriminators and insert values from variant only when + /// row contains its discriminator and default value otherwise. + mutable_column->reserve(mutable_column->size() + limit); + mutable_column = nullable_col ? nullable_col->getNestedColumnPtr()->assumeMutable() : std::move(mutable_column); + ColumnPtr variant_col = mutable_column->cloneEmpty(); + + /// Special case when our result column is LowCardinality(Nullable(T)). + /// We should remove Nullable from variant column before deserialization. 
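Note: the bulk-deserialization path above distinguishes three cases by comparing how many discriminators reference this variant with the total number of rows: all rows (deserialize straight into the result column), none (insert defaults), or a mix (deserialize the compact variant into a temporary column and scatter it while walking the discriminators). A standalone sketch of the general scatter step, using plain std::vector in place of IColumn:

#include <cstddef>
#include <cstdint>
#include <optional>
#include <vector>

// Expand a compact variant column (values exist only for rows of this variant)
// into a full-size column, guided by the per-row discriminators.
template <typename T>
std::vector<std::optional<T>> scatterVariant(
    const std::vector<uint8_t> & discriminators,
    const std::vector<T> & compact_values,
    uint8_t this_variant)
{
    std::vector<std::optional<T>> result;
    result.reserve(discriminators.size());

    size_t next = 0;  // index of the next unread value in the compact column
    for (uint8_t discr : discriminators)
    {
        if (discr == this_variant)
            result.emplace_back(compact_values[next++]);  // row belongs to this variant
        else
            result.emplace_back(std::nullopt);            // other variant or NULL -> default/NULL
    }
    return result;
}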
+ if (isColumnLowCardinalityNullable(*column)) + assert_cast(*variant_col->assumeMutable()).nestedRemoveNullable(); + + addVariantToPath(settings.path); + nested_serialization->deserializeBinaryBulkWithMultipleStreams(variant_col, variant_size, settings, state, cache); + removeVariantFromPath(settings.path); + + size_t variant_index = 0; + for (auto discr : discriminators_data) + { + if (discr == variant_discriminator) + { + if (null_map) + null_map->push_back(0); + mutable_column->insertFrom(*variant_col, variant_index++); + } + else + { + if (null_map) + null_map->push_back(1); + mutable_column->insertDefault(); + } + } +} + +void SerializationVariantElement::addVariantToPath(DB::ISerialization::SubstreamPath & path) const +{ + path.push_back(Substream::VariantElements); + path.push_back(Substream::VariantElement); + path.back().variant_element_name = variant_element_name; +} + +void SerializationVariantElement::removeVariantFromPath(DB::ISerialization::SubstreamPath & path) const +{ + path.pop_back(); + path.pop_back(); +} + +SerializationVariantElement::VariantSubcolumnCreator::VariantSubcolumnCreator( + const DB::ColumnPtr & local_discriminators_, + const DB::String & variant_element_name_, + const ColumnVariant::Discriminator global_variant_discriminator_, + const ColumnVariant::Discriminator local_variant_discriminator_) + : local_discriminators(local_discriminators_) + , variant_element_name(variant_element_name_) + , global_variant_discriminator(global_variant_discriminator_) + , local_variant_discriminator(local_variant_discriminator_) +{ +} + +DataTypePtr SerializationVariantElement::VariantSubcolumnCreator::create(const DB::DataTypePtr & prev) const +{ + return makeNullableOrLowCardinalityNullableSafe(prev); +} + +SerializationPtr SerializationVariantElement::VariantSubcolumnCreator::create(const DB::SerializationPtr & prev) const +{ + return std::make_shared(prev, variant_element_name, global_variant_discriminator); +} + +ColumnPtr SerializationVariantElement::VariantSubcolumnCreator::create(const DB::ColumnPtr & prev) const +{ + /// Case when original Variant column contained only one non-empty variant and no NULLs. + /// In this case just use this variant. + if (prev->size() == local_discriminators->size()) + return makeNullableOrLowCardinalityNullableSafe(prev); + + /// If this variant is empty, fill result column with default values. + if (prev->empty()) + { + auto res = IColumn::mutate(makeNullableOrLowCardinalityNullableSafe(prev)); + res->insertManyDefaults(local_discriminators->size()); + return res; + } + + /// In general case we should iterate through discriminators and create null-map for our variant. + NullMap null_map; + null_map.reserve(local_discriminators->size()); + const auto & local_discriminators_data = assert_cast(*local_discriminators).getData(); + for (auto local_discr : local_discriminators_data) + null_map.push_back(local_discr != local_variant_discriminator); + + /// Now we can create new column from null-map and variant column using IColumn::expand. + auto res_column = IColumn::mutate(prev); + + /// Special case for LowCardinality. We want the result to be LowCardinality(Nullable), + /// but we don't have a good way to apply null-mask for LowCardinality(), so, we first + /// convert our column to LowCardinality(Nullable()) and then use expand which will + /// fill rows with 0 in mask with default value (that is NULL). 
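Note: the subcolumn creator turns the compact variant column into a full-size Nullable column. It derives a null map from the local discriminators (1 means "row does not belong to this variant") and then, via the expand call just below, spreads the stored values so that every foreign row becomes a default value masked as NULL. A small model of that expand step, with keep_mask as the inverse of the null map (1 means "this row has a real value"):

#include <cstddef>
#include <cstdint>
#include <vector>

// Rows where keep_mask[i] == 0 get a default value; rows where keep_mask[i] == 1
// consume the next value from the compact column, in order.
std::vector<int64_t> expandByMask(const std::vector<int64_t> & compact, const std::vector<uint8_t> & keep_mask)
{
    std::vector<int64_t> result(keep_mask.size(), 0);  // 0 plays the role of the default value
    size_t next = 0;
    for (size_t i = 0; i != keep_mask.size(); ++i)
        if (keep_mask[i])
            result[i] = compact[next++];
    return result;
}

The null map itself is then reused as the Nullable mask, so the defaulted rows read back as NULL.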
+ if (prev->lowCardinality()) + res_column = assert_cast(*res_column).cloneNullable(); + + res_column->expand(null_map, /*inverted = */ true); + + if (res_column->canBeInsideNullable()) + { + auto null_map_col = ColumnUInt8::create(); + null_map_col->getData() = std::move(null_map); + return ColumnNullable::create(std::move(res_column), std::move(null_map_col)); + } + + return res_column; +} + +} diff --git a/src/DataTypes/Serializations/SerializationVariantElement.h b/src/DataTypes/Serializations/SerializationVariantElement.h new file mode 100644 index 00000000000..c343c219cf3 --- /dev/null +++ b/src/DataTypes/Serializations/SerializationVariantElement.h @@ -0,0 +1,87 @@ +#pragma once + +#include +#include +#include +#include + +namespace DB +{ + +class SerializationVariant; + +/// Serialization for Variant element when we read it as a subcolumn. +class SerializationVariantElement final : public SerializationWrapper +{ +private: + /// To be able to deserialize Variant element as a subcolumn + /// we need its type name and global discriminator. + String variant_element_name; + ColumnVariant::Discriminator variant_discriminator; + +public: + SerializationVariantElement(const SerializationPtr & nested_, const String & variant_element_name_, ColumnVariant::Discriminator variant_discriminator_) + : SerializationWrapper(nested_) + , variant_element_name(variant_element_name_) + , variant_discriminator(variant_discriminator_) + { + } + + void enumerateStreams( + EnumerateStreamsSettings & settings, + const StreamCallback & callback, + const SubstreamData & data) const override; + + void serializeBinaryBulkStatePrefix( + const IColumn & column, + SerializeBinaryBulkSettings & settings, + SerializeBinaryBulkStatePtr & state) const override; + + void serializeBinaryBulkStateSuffix( + SerializeBinaryBulkSettings & settings, + SerializeBinaryBulkStatePtr & state) const override; + + void deserializeBinaryBulkStatePrefix( + DeserializeBinaryBulkSettings & settings, + DeserializeBinaryBulkStatePtr & state) const override; + + void serializeBinaryBulkWithMultipleStreams( + const IColumn & column, + size_t offset, + size_t limit, + SerializeBinaryBulkSettings & settings, + SerializeBinaryBulkStatePtr & state) const override; + + void deserializeBinaryBulkWithMultipleStreams( + ColumnPtr & column, + size_t limit, + DeserializeBinaryBulkSettings & settings, + DeserializeBinaryBulkStatePtr & state, + SubstreamsCache * cache) const override; + +private: + friend SerializationVariant; + + void addVariantToPath(SubstreamPath & path) const; + void removeVariantFromPath(SubstreamPath & path) const; + + struct VariantSubcolumnCreator : public ISubcolumnCreator + { + const ColumnPtr local_discriminators; + const String variant_element_name; + const ColumnVariant::Discriminator global_variant_discriminator; + const ColumnVariant::Discriminator local_variant_discriminator; + + VariantSubcolumnCreator( + const ColumnPtr & local_discriminators_, + const String & variant_element_name_, + const ColumnVariant::Discriminator global_variant_discriminator_, + const ColumnVariant::Discriminator local_variant_discriminator_); + + DataTypePtr create(const DataTypePtr & prev) const override; + ColumnPtr create(const ColumnPtr & prev) const override; + SerializationPtr create(const SerializationPtr & prev) const override; + }; +}; + +} diff --git a/src/DataTypes/Serializations/SerializationWrapper.cpp b/src/DataTypes/Serializations/SerializationWrapper.cpp index 18e4891ee65..bde52bb8096 100644 --- 
a/src/DataTypes/Serializations/SerializationWrapper.cpp +++ b/src/DataTypes/Serializations/SerializationWrapper.cpp @@ -96,6 +96,11 @@ void SerializationWrapper::deserializeTextEscaped(IColumn & column, ReadBuffer & nested_serialization->deserializeTextEscaped(column, istr, settings); } +bool SerializationWrapper::tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return nested_serialization->tryDeserializeTextEscaped(column, istr, settings); +} + void SerializationWrapper::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { nested_serialization->serializeTextQuoted(column, row_num, ostr, settings); @@ -106,6 +111,11 @@ void SerializationWrapper::deserializeTextQuoted(IColumn & column, ReadBuffer & nested_serialization->deserializeTextQuoted(column, istr, settings); } +bool SerializationWrapper::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return nested_serialization->tryDeserializeTextQuoted(column, istr, settings); +} + void SerializationWrapper::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { nested_serialization->serializeTextCSV(column, row_num, ostr, settings); @@ -116,6 +126,11 @@ void SerializationWrapper::deserializeTextCSV(IColumn & column, ReadBuffer & ist nested_serialization->deserializeTextCSV(column, istr, settings); } +bool SerializationWrapper::tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return nested_serialization->tryDeserializeTextCSV(column, istr, settings); +} + void SerializationWrapper::serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { nested_serialization->serializeText(column, row_num, ostr, settings); @@ -126,6 +141,11 @@ void SerializationWrapper::deserializeWholeText(IColumn & column, ReadBuffer & i nested_serialization->deserializeWholeText(column, istr, settings); } +bool SerializationWrapper::tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return nested_serialization->tryDeserializeWholeText(column, istr, settings); +} + void SerializationWrapper::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const { nested_serialization->serializeTextJSON(column, row_num, ostr, settings); @@ -136,6 +156,11 @@ void SerializationWrapper::deserializeTextJSON(IColumn & column, ReadBuffer & is nested_serialization->deserializeTextJSON(column, istr, settings); } +bool SerializationWrapper::tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const +{ + return nested_serialization->tryDeserializeTextJSON(column, istr, settings); +} + void SerializationWrapper::serializeTextJSONPretty(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings, size_t indent) const { nested_serialization->serializeTextJSONPretty(column, row_num, ostr, settings, indent); diff --git a/src/DataTypes/Serializations/SerializationWrapper.h b/src/DataTypes/Serializations/SerializationWrapper.h index 31900f93148..6c5e2046062 100644 --- a/src/DataTypes/Serializations/SerializationWrapper.h +++ b/src/DataTypes/Serializations/SerializationWrapper.h @@ -63,18 +63,23 @@ public: void serializeTextEscaped(const IColumn & column, size_t row_num, 
WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const override; void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings &) const override; void serializeTextJSONPretty(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings, size_t indent) const override; void serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings & settings) const override; diff --git a/src/DataTypes/Serializations/SimpleTextSerialization.h b/src/DataTypes/Serializations/SimpleTextSerialization.h index 0247f30b30a..11f56de73d1 100644 --- a/src/DataTypes/Serializations/SimpleTextSerialization.h +++ b/src/DataTypes/Serializations/SimpleTextSerialization.h @@ -36,29 +36,67 @@ protected: deserializeText(column, istr, settings, true); } + bool tryDeserializeWholeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override + { + return tryDeserializeText(column, istr, settings, true); + } + void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override { deserializeText(column, istr, settings, false); } + bool tryDeserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override + { + return tryDeserializeText(column, istr, settings, false); + } + void deserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override { deserializeText(column, istr, settings, false); } + bool tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override + { + return tryDeserializeText(column, istr, settings, false); + } + void deserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override { deserializeText(column, istr, settings, false); } + bool tryDeserializeTextJSON(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override + { + return tryDeserializeText(column, istr, settings, false); + } + void deserializeTextCSV(IColumn & column, ReadBuffer & istr, 
const FormatSettings & settings) const override { deserializeText(column, istr, settings, false); } + bool tryDeserializeTextCSV(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const override + { + return tryDeserializeText(column, istr, settings, false); + } + /// whole = true means that buffer contains only one value, so we should read until EOF. /// It's needed to check if there is garbage after parsed field. virtual void deserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const = 0; + + virtual bool tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings & settings, bool whole) const + { + try + { + deserializeText(column, istr, settings, whole); + return true; + } + catch (...) + { + return false; + } + } }; } diff --git a/src/DataTypes/Utils.cpp b/src/DataTypes/Utils.cpp index e58331a8bcb..2f29d57d454 100644 --- a/src/DataTypes/Utils.cpp +++ b/src/DataTypes/Utils.cpp @@ -223,6 +223,7 @@ bool canBeSafelyCasted(const DataTypePtr & from_type, const DataTypePtr & to_typ case TypeIndex::AggregateFunction: case TypeIndex::Nothing: case TypeIndex::JSONPaths: + case TypeIndex::Variant: return false; } diff --git a/src/Databases/DatabaseReplicated.cpp b/src/Databases/DatabaseReplicated.cpp index 36dd858dcf7..76f6dc25aae 100644 --- a/src/Databases/DatabaseReplicated.cpp +++ b/src/Databases/DatabaseReplicated.cpp @@ -907,6 +907,7 @@ void DatabaseReplicated::recoverLostReplica(const ZooKeeperPtr & current_zookeep query_context->setSetting("allow_experimental_nlp_functions", 1); query_context->setSetting("allow_experimental_hash_functions", 1); query_context->setSetting("allow_experimental_object_type", 1); + query_context->setSetting("allow_experimental_variant_type", 1); query_context->setSetting("allow_experimental_annoy_index", 1); query_context->setSetting("allow_experimental_usearch_index", 1); query_context->setSetting("allow_experimental_bigint_types", 1); diff --git a/src/Formats/EscapingRuleUtils.cpp b/src/Formats/EscapingRuleUtils.cpp index 9cc7cb3b89e..a2528f9f948 100644 --- a/src/Formats/EscapingRuleUtils.cpp +++ b/src/Formats/EscapingRuleUtils.cpp @@ -109,31 +109,31 @@ bool deserializeFieldByEscapingRule( { case FormatSettings::EscapingRule::Escaped: if (parse_as_nullable) - read = SerializationNullable::deserializeTextEscapedImpl(column, buf, format_settings, serialization); + read = SerializationNullable::deserializeNullAsDefaultOrNestedTextEscaped(column, buf, format_settings, serialization); else serialization->deserializeTextEscaped(column, buf, format_settings); break; case FormatSettings::EscapingRule::Quoted: if (parse_as_nullable) - read = SerializationNullable::deserializeTextQuotedImpl(column, buf, format_settings, serialization); + read = SerializationNullable::deserializeNullAsDefaultOrNestedTextQuoted(column, buf, format_settings, serialization); else serialization->deserializeTextQuoted(column, buf, format_settings); break; case FormatSettings::EscapingRule::CSV: if (parse_as_nullable) - read = SerializationNullable::deserializeTextCSVImpl(column, buf, format_settings, serialization); + read = SerializationNullable::deserializeNullAsDefaultOrNestedTextCSV(column, buf, format_settings, serialization); else serialization->deserializeTextCSV(column, buf, format_settings); break; case FormatSettings::EscapingRule::JSON: if (parse_as_nullable) - read = SerializationNullable::deserializeTextJSONImpl(column, buf, format_settings, serialization); + read = 
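Note: the default tryDeserializeText above derives a non-throwing "try" entry point from the existing throwing deserializeText by catching all exceptions; serializations that can do better override it. The same wrapper pattern in isolation (parse function and types are illustrative):

#include <cstddef>
#include <stdexcept>
#include <string>

// Throwing API: the "old" entry point that reports failure via exceptions.
int parseOrThrow(const std::string & s)
{
    size_t pos = 0;
    int value = std::stoi(s, &pos);          // throws std::invalid_argument / std::out_of_range
    if (pos != s.size())
        throw std::runtime_error("garbage after the number: " + s);
    return value;
}

// Non-throwing wrapper: default implementation of the "try" API on top of the throwing one.
bool tryParse(const std::string & s, int & out)
{
    try
    {
        out = parseOrThrow(s);
        return true;
    }
    catch (...)   // any parsing error just means "this value does not fit this type"
    {
        return false;
    }
}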
SerializationNullable::deserializeNullAsDefaultOrNestedTextJSON(column, buf, format_settings, serialization); else serialization->deserializeTextJSON(column, buf, format_settings); break; case FormatSettings::EscapingRule::Raw: if (parse_as_nullable) - read = SerializationNullable::deserializeTextRawImpl(column, buf, format_settings, serialization); + read = SerializationNullable::deserializeNullAsDefaultOrNestedTextRaw(column, buf, format_settings, serialization); else serialization->deserializeTextRaw(column, buf, format_settings); break; diff --git a/src/Formats/JSONUtils.cpp b/src/Formats/JSONUtils.cpp index 7ddfdb6b572..4e7795f61bd 100644 --- a/src/Formats/JSONUtils.cpp +++ b/src/Formats/JSONUtils.cpp @@ -288,14 +288,14 @@ namespace JSONUtils ReadBufferFromString buf(str); if (as_nullable) - return SerializationNullable::deserializeWholeTextImpl(column, buf, format_settings, serialization); + return SerializationNullable::deserializeNullAsDefaultOrNestedWholeText(column, buf, format_settings, serialization); serialization->deserializeWholeText(column, buf, format_settings); return true; } if (as_nullable) - return SerializationNullable::deserializeTextJSONImpl(column, in, format_settings, serialization); + return SerializationNullable::deserializeNullAsDefaultOrNestedTextJSON(column, in, format_settings, serialization); serialization->deserializeTextJSON(column, in, format_settings); return true; diff --git a/src/Formats/SchemaInferenceUtils.cpp b/src/Formats/SchemaInferenceUtils.cpp index e2ba188d015..6890e412f75 100644 --- a/src/Formats/SchemaInferenceUtils.cpp +++ b/src/Formats/SchemaInferenceUtils.cpp @@ -946,7 +946,7 @@ namespace if constexpr (is_json) ok = tryReadJSONStringInto(field, buf); else - ok = tryReadQuotedStringInto(field, buf); + ok = tryReadQuotedString(field, buf); if (!ok) return nullptr; diff --git a/src/Functions/FunctionsConversion.h b/src/Functions/FunctionsConversion.h index bef1e7b420a..f9f61ceed0d 100644 --- a/src/Functions/FunctionsConversion.h +++ b/src/Functions/FunctionsConversion.h @@ -28,6 +28,7 @@ #include #include #include +#include #include #include #include @@ -40,6 +41,7 @@ #include #include #include +#include #include #include #include @@ -4067,6 +4069,259 @@ arguments, result_type, input_rows_count); \ "Cast to Object can be performed only from flatten named Tuple, Map or String. Got: {}", from_type->getName()); } + WrapperType createVariantToVariantWrapper(const DataTypeVariant & from_variant, const DataTypeVariant & to_variant) const + { + /// We support only extension of variant type, so, only new types can be added. + /// For example: Variant(T1, T2) -> Variant(T1, T2, T3) is supported, but Variant(T1, T2) -> Variant(T1, T3) is not supported. + /// We want to extend Variant type for free without rewriting the data, but we sort data types inside Variant during type creation + /// (we do it because we want Variant(T1, T2) to be the same as Variant(T2, T1)), but after extension the order of variant types + /// (and so their discriminators) can be different. For example: Variant(T1, T3) -> Variant(T1, T2, T3). + /// To avoid full rewrite of discriminators column, ColumnVariant supports it's local order of variant columns (and so local + /// discriminators) and stores mapping global order -> local order. + /// So, to extend Variant with new types for free, we should keep old local order for old variants, append new variants and change + /// mapping global order -> local order according to the new global order. 
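Note: the comment above describes how a Variant can be extended without rewriting data: keep the existing local order of variant columns, append empty columns for the new types, and only remap the "local -> global" discriminator table to the new global order. A self-contained sketch of that remapping, with type names standing in for DataTypePtr:

#include <cstddef>
#include <cstdint>
#include <stdexcept>
#include <string>
#include <unordered_map>
#include <vector>

// Given old and new variant type lists (each in its own global order), compute the new
// local->global mapping for a column that keeps its old local layout.
std::vector<uint8_t> remapLocalToGlobal(
    const std::vector<std::string> & old_types,          // old global order
    const std::vector<std::string> & new_types,          // new (extended) global order
    const std::vector<uint8_t> & old_local_to_global)    // column's current mapping
{
    std::unordered_map<std::string, uint8_t> new_global;
    for (size_t i = 0; i != new_types.size(); ++i)
        new_global[new_types[i]] = static_cast<uint8_t>(i);

    std::vector<uint8_t> result;
    result.reserve(old_local_to_global.size());
    for (uint8_t old_global : old_local_to_global)
    {
        auto it = new_global.find(old_types[old_global]);
        if (it == new_global.end())
            throw std::runtime_error("new Variant must be an extension of the old one");
        result.push_back(it->second);   // same local position, new global discriminator
    }
    return result;
}

The new variant types are then appended as empty columns after the remap; the discriminators and offsets columns themselves stay untouched.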
+ + /// Create map (new variant type) -> (it's global discriminator in new order). + const auto & new_variants = to_variant.getVariants(); + std::unordered_map new_variant_types_to_new_global_discriminator; + new_variant_types_to_new_global_discriminator.reserve(new_variants.size()); + for (size_t i = 0; i != new_variants.size(); ++i) + new_variant_types_to_new_global_discriminator[new_variants[i]->getName()] = i; + + /// Create set of old variant types. + const auto & old_variants = from_variant.getVariants(); + std::unordered_map old_variant_types_to_old_global_discriminator; + old_variant_types_to_old_global_discriminator.reserve(old_variants.size()); + for (size_t i = 0; i != old_variants.size(); ++i) + old_variant_types_to_old_global_discriminator[old_variants[i]->getName()] = i; + + /// Check that the set of old variants types is a subset of new variant types and collect new global discriminator for each old global discriminator. + std::unordered_map old_global_discriminator_to_new; + old_global_discriminator_to_new.reserve(old_variants.size()); + for (const auto & [old_variant_type, old_discriminator] : old_variant_types_to_old_global_discriminator) + { + auto it = new_variant_types_to_new_global_discriminator.find(old_variant_type); + if (it == new_variant_types_to_new_global_discriminator.end()) + throw Exception( + ErrorCodes::CANNOT_CONVERT_TYPE, + "Cannot convert type {} to {}. Conversion between Variant types is allowed only when new Variant type is an extension " + "of an initial one", from_variant.getName(), to_variant.getName()); + old_global_discriminator_to_new[old_discriminator] = it->second; + } + + /// Collect variant types and their global discriminators that should be added to the old Variant to get the new Variant. + std::vector> variant_types_and_discriminators_to_add; + variant_types_and_discriminators_to_add.reserve(new_variants.size() - old_variants.size()); + for (size_t i = 0; i != new_variants.size(); ++i) + { + if (!old_variant_types_to_old_global_discriminator.contains(new_variants[i]->getName())) + variant_types_and_discriminators_to_add.emplace_back(new_variants[i], i); + } + + return [old_global_discriminator_to_new, variant_types_and_discriminators_to_add] + (ColumnsWithTypeAndName & arguments, const DataTypePtr &, const ColumnNullable *, size_t) -> ColumnPtr + { + const auto & column_variant = assert_cast(*arguments.front().column.get()); + size_t num_old_variants = column_variant.getNumVariants(); + Columns new_variant_columns; + new_variant_columns.reserve(num_old_variants + variant_types_and_discriminators_to_add.size()); + std::vector new_local_to_global_discriminators; + new_local_to_global_discriminators.reserve(num_old_variants + variant_types_and_discriminators_to_add.size()); + for (size_t i = 0; i != num_old_variants; ++i) + { + new_variant_columns.push_back(column_variant.getVariantPtrByLocalDiscriminator(i)); + new_local_to_global_discriminators.push_back(old_global_discriminator_to_new.at(column_variant.globalDiscriminatorByLocal(i))); + } + + for (const auto & [new_variant_type, new_global_discriminator] : variant_types_and_discriminators_to_add) + { + new_variant_columns.push_back(new_variant_type->createColumn()); + new_local_to_global_discriminators.push_back(new_global_discriminator); + } + + return ColumnVariant::create(column_variant.getLocalDiscriminatorsPtr(), column_variant.getOffsetsPtr(), new_variant_columns, new_local_to_global_discriminators); + }; + } + + WrapperType createVariantToColumnWrapper(const DataTypeVariant & 
from_variant, const DataTypePtr & to_type) const + { + const auto & variant_types = from_variant.getVariants(); + std::vector variant_wrappers; + variant_wrappers.reserve(variant_types.size()); + + /// Create conversion wrapper for each variant. + for (const auto & variant_type : variant_types) + variant_wrappers.push_back(prepareUnpackDictionaries(variant_type, to_type)); + + return [variant_wrappers, variant_types, to_type] + (ColumnsWithTypeAndName & arguments, const DataTypePtr & result_type, const ColumnNullable *, size_t input_rows_count) -> ColumnPtr + { + const auto & column_variant = assert_cast(*arguments.front().column.get()); + + /// First, cast each variant to the result type. + std::vector casted_variant_columns; + casted_variant_columns.reserve(variant_types.size()); + for (size_t i = 0; i != variant_types.size(); ++i) + { + auto variant_col = column_variant.getVariantPtrByLocalDiscriminator(i); + ColumnsWithTypeAndName variant = {{variant_col, variant_types[i], "" }}; + const auto & variant_wrapper = variant_wrappers[column_variant.globalDiscriminatorByLocal(i)]; + casted_variant_columns.push_back(variant_wrapper(variant, result_type, nullptr, variant_col->size())); + } + + /// Second, construct resulting column from casted variant columns according to discriminators. + const auto & local_discriminators = column_variant.getLocalDiscriminators(); + auto res = result_type->createColumn(); + res->reserve(input_rows_count); + for (size_t i = 0; i != input_rows_count; ++i) + { + auto local_discr = local_discriminators[i]; + if (local_discr == ColumnVariant::NULL_DISCRIMINATOR) + res->insertDefault(); + else + res->insertFrom(*casted_variant_columns[local_discr], column_variant.offsetAt(i)); + } + + return res; + }; + } + + static ColumnPtr createVariantFromDescriptorsAndOneNonEmptyVariant(const DataTypes & variant_types, const ColumnPtr & discriminators, const ColumnPtr & variant, ColumnVariant::Discriminator variant_discr) + { + Columns variants; + variants.reserve(variant_types.size()); + for (size_t i = 0; i != variant_types.size(); ++i) + { + if (i == variant_discr) + variants.emplace_back(variant); + else + variants.push_back(variant_types[i]->createColumn()); + } + + return ColumnVariant::create(discriminators, variants); + } + + WrapperType createColumnToVariantWrapper(const DataTypePtr & from_type, const DataTypeVariant & to_variant) const + { + /// We allow converting NULL to Variant(...) as Variant can store NULLs. + if (from_type->onlyNull()) + { + return [](ColumnsWithTypeAndName &, const DataTypePtr & result_type, const ColumnNullable *, size_t input_rows_count) -> ColumnPtr + { + auto result_column = result_type->createColumn(); + result_column->insertManyDefaults(input_rows_count); + return result_column; + }; + } + + auto variant_discr_opt = to_variant.tryGetVariantDiscriminator(removeNullableOrLowCardinalityNullable(from_type)); + if (!variant_discr_opt) + throw Exception(ErrorCodes::CANNOT_CONVERT_TYPE, "Cannot convert type {} to {}. 
Conversion to Variant allowed only for types from this Variant", from_type->getName(), to_variant.getName()); + + return [variant_discr = *variant_discr_opt] + (ColumnsWithTypeAndName & arguments, const DataTypePtr & result_type, const ColumnNullable *, size_t) -> ColumnPtr + { + const auto & result_variant_type = assert_cast(*result_type); + const auto & variant_types = result_variant_type.getVariants(); + if (const ColumnNullable * col_nullable = typeid_cast(arguments.front().column.get())) + { + const auto & column = col_nullable->getNestedColumnPtr(); + const auto & null_map = col_nullable->getNullMapData(); + IColumn::Filter filter; + filter.reserve(column->size()); + auto discriminators = ColumnVariant::ColumnDiscriminators::create(); + auto & discriminators_data = discriminators->getData(); + discriminators_data.reserve(column->size()); + size_t variant_size_hint = 0; + for (size_t i = 0; i != column->size(); ++i) + { + if (null_map[i]) + { + discriminators_data.push_back(ColumnVariant::NULL_DISCRIMINATOR); + filter.push_back(0); + } + else + { + discriminators_data.push_back(variant_discr); + filter.push_back(1); + ++variant_size_hint; + } + } + + ColumnPtr variant_column; + /// If there were no NULLs, just use the column. + if (variant_size_hint == column->size()) + variant_column = column; + /// Otherwise we should use filtered column. + else + variant_column = column->filter(filter, variant_size_hint); + return createVariantFromDescriptorsAndOneNonEmptyVariant(variant_types, std::move(discriminators), variant_column, variant_discr); + } + else if (isColumnLowCardinalityNullable(*arguments.front().column)) + { + const auto & column = arguments.front().column; + + /// Variant column cannot have LowCardinality(Nullable(...)) variant, as Variant column stores NULLs itself. + /// We should create a null-map, insert NULL_DISCRIMINATOR on NULL values and filter initial column. + const auto & col_lc = assert_cast(*column); + const auto & indexes = col_lc.getIndexes(); + auto null_index = col_lc.getDictionary().getNullValueIndex(); + IColumn::Filter filter; + filter.reserve(col_lc.size()); + auto discriminators = ColumnVariant::ColumnDiscriminators::create(); + auto & discriminators_data = discriminators->getData(); + discriminators_data.reserve(col_lc.size()); + size_t variant_size_hint = 0; + for (size_t i = 0; i != col_lc.size(); ++i) + { + if (indexes.getUInt(i) == null_index) + { + discriminators_data.push_back(ColumnVariant::NULL_DISCRIMINATOR); + filter.push_back(0); + } + else + { + discriminators_data.push_back(variant_discr); + filter.push_back(1); + ++variant_size_hint; + } + } + + MutableColumnPtr variant_column; + /// If there were no NULLs, we can just clone the column. + if (variant_size_hint == col_lc.size()) + variant_column = IColumn::mutate(column); + /// Otherwise we should filter column. 
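Note: converting a Nullable column into a Variant, as above, means splitting it into two parallel structures: a discriminators column (NULL_DISCRIMINATOR for NULL rows, the target variant's discriminator otherwise) and a compacted variant column that keeps only the non-NULL values. A simplified model over std::optional values:

#include <cstdint>
#include <optional>
#include <vector>

constexpr uint8_t NULL_DISCRIMINATOR = 255;

struct SplitResult
{
    std::vector<uint8_t> discriminators;  // one entry per input row
    std::vector<int64_t> variant_values;  // only the non-NULL rows, in order
};

SplitResult splitNullableIntoVariant(const std::vector<std::optional<int64_t>> & input, uint8_t variant_discr)
{
    SplitResult res;
    res.discriminators.reserve(input.size());
    for (const auto & value : input)
    {
        if (!value)
        {
            res.discriminators.push_back(NULL_DISCRIMINATOR);   // row is NULL, nothing stored in the variant
        }
        else
        {
            res.discriminators.push_back(variant_discr);
            res.variant_values.push_back(*value);               // the "filter": keep only real values
        }
    }
    return res;
}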
+ else + variant_column = column->filter(filter, variant_size_hint)->assumeMutable(); + + assert_cast(*variant_column).nestedRemoveNullable(); + return createVariantFromDescriptorsAndOneNonEmptyVariant(variant_types, std::move(discriminators), std::move(variant_column), variant_discr); + } + else + { + const auto & column = arguments.front().column; + auto discriminators = ColumnVariant::ColumnDiscriminators::create(); + discriminators->getData().resize_fill(column->size(), variant_discr); + return createVariantFromDescriptorsAndOneNonEmptyVariant(variant_types, std::move(discriminators), column, variant_discr); + } + }; + } + + /// Wrapper for conversion to/from Variant type + WrapperType createVariantWrapper(const DataTypePtr & from_type, const DataTypePtr & to_type) const + { + if (const auto * from_variant = checkAndGetDataType(from_type.get())) + { + if (const auto * to_variant = checkAndGetDataType(to_type.get())) + return createVariantToVariantWrapper(*from_variant, *to_variant); + + return createVariantToColumnWrapper(*from_variant, to_type); + } + + return createColumnToVariantWrapper(from_type, assert_cast(*to_type)); + } + template WrapperType createEnumWrapper(const DataTypePtr & from_type, const DataTypeEnum * to_type) const { @@ -4246,6 +4501,11 @@ arguments, result_type, input_rows_count); \ WrapperType prepareUnpackDictionaries(const DataTypePtr & from_type, const DataTypePtr & to_type) const { + /// Conversion from/to Variant data type is processed in a special way. + /// We don't need to remove LowCardinality/Nullable. + if (isVariant(to_type) || isVariant(from_type)) + return createVariantWrapper(from_type, to_type); + const auto * from_low_cardinality = typeid_cast(from_type.get()); const auto * to_low_cardinality = typeid_cast(to_type.get()); const auto & from_nested = from_low_cardinality ? 
from_low_cardinality->getDictionaryType() : from_type; @@ -4253,7 +4513,7 @@ arguments, result_type, input_rows_count); \ if (from_type->onlyNull()) { - if (!to_nested->isNullable()) + if (!to_nested->isNullable() && !isVariant(to_type)) { if (cast_type == CastType::accurateOrNull) { diff --git a/src/Functions/if.cpp b/src/Functions/if.cpp index eba1733c683..b15bc5938be 100644 --- a/src/Functions/if.cpp +++ b/src/Functions/if.cpp @@ -4,6 +4,7 @@ #include #include #include +#include #include #include #include @@ -14,6 +15,7 @@ #include #include #include +#include #include #include #include @@ -22,6 +24,8 @@ #include #include #include +#include + #include @@ -215,9 +219,16 @@ class FunctionIf : public FunctionIfBase { public: static constexpr auto name = "if"; - static FunctionPtr create(ContextPtr) { return std::make_shared(); } + static FunctionPtr create(ContextPtr context) + { + return std::make_shared(context->getSettingsRef().allow_experimental_variant_type && context->getSettingsRef().use_variant_when_no_common_type_in_if); + } + + FunctionIf(bool use_variant_when_no_common_type_ = false) : FunctionIfBase(), use_variant_when_no_common_type(use_variant_when_no_common_type_) {} private: + bool use_variant_when_no_common_type = false; + template static UInt32 decimalScale(const ColumnsWithTypeAndName & arguments [[maybe_unused]]) { @@ -626,13 +637,23 @@ private: } static ColumnPtr executeGeneric( - const ColumnUInt8 * cond_col, const ColumnsWithTypeAndName & arguments, size_t input_rows_count) + const ColumnUInt8 * cond_col, const ColumnsWithTypeAndName & arguments, size_t input_rows_count, bool use_variant_when_no_common_type) { /// Convert both columns to the common type (if needed). const ColumnWithTypeAndName & arg1 = arguments[1]; const ColumnWithTypeAndName & arg2 = arguments[2]; - DataTypePtr common_type = getLeastSupertype(DataTypes{arg1.type, arg2.type}); + DataTypePtr common_type; + if (use_variant_when_no_common_type) + { + common_type = tryGetLeastSupertype(DataTypes{arg1.type, arg2.type}); + if (!common_type) + common_type = std::make_shared(DataTypes{removeNullableOrLowCardinalityNullable(arg1.type), removeNullableOrLowCardinalityNullable(arg2.type)}); + } + else + { + common_type = getLeastSupertype(DataTypes{arg1.type, arg2.type}); + } ColumnPtr col_then = castColumn(arg1, common_type); ColumnPtr col_else = castColumn(arg2, common_type); @@ -807,6 +828,10 @@ private: ColumnPtr executeForNullableThenElse(const ColumnsWithTypeAndName & arguments, const DataTypePtr & result_type, size_t input_rows_count) const { + /// If result type is Variant, we don't need to remove Nullable. 
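Note: with allow_experimental_variant_type and use_variant_when_no_common_type_in_if enabled, if() above no longer fails when the branches have no common type: it first tries the least supertype and otherwise builds a Variant of the (de-Nullable-ized) branch types. A toy model of that decision, not the real IDataType machinery:

#include <memory>
#include <stdexcept>
#include <string>

// Toy type model: a "supertype" exists only when both branches have the same type name.
struct Type { std::string name; };
using TypePtr = std::shared_ptr<Type>;

TypePtr tryCommonSupertype(const TypePtr & a, const TypePtr & b)
{
    return a->name == b->name ? a : nullptr;   // the real logic lives in tryGetLeastSupertype()
}

// Prefer a common supertype; otherwise wrap both branch types into a Variant instead of throwing.
TypePtr ifReturnType(const TypePtr & then_type, const TypePtr & else_type, bool use_variant_when_no_common_type)
{
    if (auto common = tryCommonSupertype(then_type, else_type))
        return common;
    if (use_variant_when_no_common_type)
        return std::make_shared<Type>(Type{"Variant(" + then_type->name + ", " + else_type->name + ")"});
    throw std::runtime_error("no common type for if() branches");
}

Under these settings a query such as if(cond, 1, 'str') would therefore return a Variant(String, UInt8) value rather than an error.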
+ if (isVariant(result_type)) + return nullptr; + const ColumnWithTypeAndName & arg_cond = arguments[0]; const ColumnWithTypeAndName & arg_then = arguments[1]; const ColumnWithTypeAndName & arg_else = arguments[2]; @@ -912,6 +937,11 @@ private: assert_cast(*result_column).applyNullMap(assert_cast(*arg_cond.column)); return result_column; } + else if (auto * variant_column = typeid_cast(result_column.get())) + { + variant_column->applyNullMap(assert_cast(*arg_cond.column).getData()); + return result_column; + } else return ColumnNullable::create(materializeColumnIfConst(result_column), arg_cond.column); } @@ -950,6 +980,11 @@ private: assert_cast(*result_column).applyNegatedNullMap(assert_cast(*arg_cond.column)); return result_column; } + else if (auto * variant_column = typeid_cast(result_column.get())) + { + variant_column->applyNegatedNullMap(assert_cast(*arg_cond.column).getData()); + return result_column; + } else { size_t size = input_rows_count; @@ -1039,6 +1074,13 @@ public: throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Illegal type {} of first argument (condition) of function if. " "Must be UInt8.", arguments[0]->getName()); + if (use_variant_when_no_common_type) + { + if (auto res = tryGetLeastSupertype(DataTypes{arguments[1], arguments[2]})) + return res; + return std::make_shared(DataTypes{removeNullableOrLowCardinalityNullable(arguments[1]), removeNullableOrLowCardinalityNullable(arguments[2])}); + } + return getLeastSupertype(DataTypes{arguments[1], arguments[2]}); } @@ -1122,7 +1164,7 @@ public: || (res = executeGenericArray(cond_col, arguments, result_type)) || (res = executeTuple(arguments, result_type, input_rows_count)))) { - return executeGeneric(cond_col, arguments, input_rows_count); + return executeGeneric(cond_col, arguments, input_rows_count, use_variant_when_no_common_type); } return res; diff --git a/src/Functions/isNotNull.cpp b/src/Functions/isNotNull.cpp index cbdc08c2fab..360c2fc7f9f 100644 --- a/src/Functions/isNotNull.cpp +++ b/src/Functions/isNotNull.cpp @@ -5,6 +5,7 @@ #include #include #include +#include #include @@ -45,6 +46,18 @@ public: ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t input_rows_count) const override { const ColumnWithTypeAndName & elem = arguments[0]; + + if (isVariant(elem.type)) + { + const auto & discriminators = checkAndGetColumn(*elem.column)->getLocalDiscriminators(); + auto res = DataTypeUInt8().createColumn(); + auto & data = typeid_cast(*res).getData(); + data.reserve(discriminators.size()); + for (auto discr : discriminators) + data.push_back(discr != ColumnVariant::NULL_DISCRIMINATOR); + return res; + } + if (elem.type->isLowCardinalityNullable()) { const auto * low_cardinality_column = checkAndGetColumn(*elem.column); diff --git a/src/Functions/isNull.cpp b/src/Functions/isNull.cpp index cdce037088d..4bf4e44f866 100644 --- a/src/Functions/isNull.cpp +++ b/src/Functions/isNull.cpp @@ -5,6 +5,7 @@ #include #include #include +#include namespace DB @@ -44,6 +45,18 @@ public: ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t) const override { const ColumnWithTypeAndName & elem = arguments[0]; + + if (isVariant(elem.type)) + { + const auto & discriminators = checkAndGetColumn(*elem.column)->getLocalDiscriminators(); + auto res = DataTypeUInt8().createColumn(); + auto & data = typeid_cast(*res).getData(); + data.reserve(discriminators.size()); + for (auto discr : discriminators) + data.push_back(discr == 
ColumnVariant::NULL_DISCRIMINATOR); + return res; + } + if (elem.type->isLowCardinalityNullable()) { const auto * low_cardinality_column = checkAndGetColumn(*elem.column); diff --git a/src/Functions/multiIf.cpp b/src/Functions/multiIf.cpp index cdb9ca061c3..7a2e9444b2c 100644 --- a/src/Functions/multiIf.cpp +++ b/src/Functions/multiIf.cpp @@ -9,6 +9,7 @@ #include #include #include +#include #include @@ -117,6 +118,15 @@ public: types_of_branches.emplace_back(arg); }); + if (context->getSettingsRef().allow_experimental_variant_type && context->getSettingsRef().use_variant_when_no_common_type_in_if) + { + if (auto res = tryGetLeastSupertype(types_of_branches)) + return res; + for (auto & type : types_of_branches) + type = removeNullableOrLowCardinalityNullable(type); + return std::make_shared(types_of_branches); + } + return getLeastSupertype(types_of_branches); } diff --git a/src/Functions/variantElement.cpp b/src/Functions/variantElement.cpp new file mode 100644 index 00000000000..7c63e1266e6 --- /dev/null +++ b/src/Functions/variantElement.cpp @@ -0,0 +1,238 @@ +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + + +namespace DB +{ + +namespace ErrorCodes +{ + extern const int ILLEGAL_TYPE_OF_ARGUMENT; + extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; +} + +namespace +{ + +/** Extract element of Variant by variant type name. + * Also the function looks through Arrays: you can get Array of Variant elements from Array of Variants. + */ +class FunctionVariantElement : public IFunction +{ +public: + static constexpr auto name = "variantElement"; + + static FunctionPtr create(ContextPtr) { return std::make_shared(); } + String getName() const override { return name; } + bool isVariadic() const override { return true; } + size_t getNumberOfArguments() const override { return 0; } + bool useDefaultImplementationForConstants() const override { return true; } + ColumnNumbers getArgumentsThatAreAlwaysConstant() const override { return {1}; } + bool useDefaultImplementationForNulls() const override { return false; } + bool useDefaultImplementationForLowCardinalityColumns() const override { return false; } + bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & /*arguments*/) const override { return true; } + + DataTypePtr getReturnTypeImpl(const ColumnsWithTypeAndName & arguments) const override + { + const size_t number_of_arguments = arguments.size(); + + if (number_of_arguments < 2 || number_of_arguments > 3) + throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + "Number of arguments for function {} doesn't match: passed {}, should be 2 or 3", + getName(), number_of_arguments); + + size_t count_arrays = 0; + const IDataType * input_type = arguments[0].type.get(); + while (const DataTypeArray * array = checkAndGetDataType(input_type)) + { + input_type = array->getNestedType().get(); + ++count_arrays; + } + + const DataTypeVariant * variant_type = checkAndGetDataType(input_type); + if (!variant_type) + throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, + "First argument for function {} must be Variant or Array of Variant. 
Actual {}", + getName(), + arguments[0].type->getName()); + + std::optional variant_global_discr = getVariantGlobalDiscriminator(arguments[1].column, *variant_type, number_of_arguments); + if (variant_global_discr.has_value()) + { + DataTypePtr return_type = makeNullableOrLowCardinalityNullableSafe(variant_type->getVariant(variant_global_discr.value())); + + for (; count_arrays; --count_arrays) + return_type = std::make_shared(return_type); + + return return_type; + } + else + return arguments[2].type; + } + + ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t input_rows_count) const override + { + const auto & input_arg = arguments[0]; + const IDataType * input_type = input_arg.type.get(); + const IColumn * input_col = input_arg.column.get(); + + bool input_arg_is_const = false; + if (typeid_cast(input_col)) + { + input_col = assert_cast(input_col)->getDataColumnPtr().get(); + input_arg_is_const = true; + } + + Columns array_offsets; + while (const DataTypeArray * array_type = checkAndGetDataType(input_type)) + { + const ColumnArray * array_col = assert_cast(input_col); + + input_type = array_type->getNestedType().get(); + input_col = &array_col->getData(); + array_offsets.push_back(array_col->getOffsetsPtr()); + } + + const DataTypeVariant * input_type_as_variant = checkAndGetDataType(input_type); + const ColumnVariant * input_col_as_variant = checkAndGetColumn(input_col); + if (!input_type_as_variant || !input_col_as_variant) + throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, + "First argument for function {} must be Variant or array of Variants. Actual {}", getName(), input_arg.type->getName()); + + std::optional variant_global_discr = getVariantGlobalDiscriminator(arguments[1].column, *input_type_as_variant, arguments.size()); + + if (!variant_global_discr.has_value()) + return arguments[2].column; + + const auto & variant_type = input_type_as_variant->getVariant(*variant_global_discr); + const auto & variant_column = input_col_as_variant->getVariantPtrByGlobalDiscriminator(*variant_global_discr); + + /// If Variant has only NULLs or our variant doesn't have any real values, + /// just create column with default values and create null mask with 1. + if (input_col_as_variant->hasOnlyNulls() || variant_column->empty()) + { + auto res = variant_type->createColumn(); + + if (variant_type->lowCardinality()) + assert_cast(*res).nestedToNullable(); + + res->insertManyDefaults(input_col_as_variant->size()); + if (!variant_type->canBeInsideNullable()) + return wrapInArraysAndConstIfNeeded(std::move(res), array_offsets, input_arg_is_const, input_rows_count); + + auto null_map = ColumnUInt8::create(); + auto & null_map_data = null_map->getData(); + null_map_data.resize_fill(input_col_as_variant->size(), 1); + return wrapInArraysAndConstIfNeeded(ColumnNullable::create(std::move(res), std::move(null_map)), array_offsets, input_arg_is_const, input_rows_count); + } + + /// If we extract single non-empty column and have no NULLs, then just return this variant. + if (auto non_empty_local_discr = input_col_as_variant->getLocalDiscriminatorOfOneNoneEmptyVariantNoNulls()) + { + /// If we were trying to extract some other variant, + /// it would be empty and we would already processed this case above. 
+            chassert(input_col_as_variant->globalDiscriminatorByLocal(*non_empty_local_discr) == variant_global_discr);
+            return wrapInArraysAndConstIfNeeded(makeNullableOrLowCardinalityNullableSafe(variant_column), array_offsets, input_arg_is_const, input_rows_count);
+        }
+
+        /// In the general case we should calculate a null-mask for the variant
+        /// according to the discriminators column and expand
+        /// the variant column by this mask to get a full column (with default values on NULLs).
+        const auto & local_discriminators = input_col_as_variant->getLocalDiscriminators();
+        auto null_map = ColumnUInt8::create();
+        auto & null_map_data = null_map->getData();
+        null_map_data.reserve(local_discriminators.size());
+        auto variant_local_discr = input_col_as_variant->localDiscriminatorByGlobal(*variant_global_discr);
+        for (auto local_discr : local_discriminators)
+            null_map_data.push_back(local_discr != variant_local_discr);
+
+        auto expanded_variant_column = IColumn::mutate(variant_column);
+        if (variant_type->lowCardinality())
+            expanded_variant_column = assert_cast(*expanded_variant_column).cloneNullable();
+        expanded_variant_column->expand(null_map_data, /*inverted = */ true);
+        if (variant_type->canBeInsideNullable())
+            return wrapInArraysAndConstIfNeeded(ColumnNullable::create(std::move(expanded_variant_column), std::move(null_map)), array_offsets, input_arg_is_const, input_rows_count);
+        return wrapInArraysAndConstIfNeeded(std::move(expanded_variant_column), array_offsets, input_arg_is_const, input_rows_count);
+    }
+private:
+    std::optional getVariantGlobalDiscriminator(const ColumnPtr & index_column, const DataTypeVariant & variant_type, size_t argument_size) const
+    {
+        const auto * name_col = checkAndGetColumnConst(index_column.get());
+        if (!name_col)
+            throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT,
+                "Second argument to {} with Variant argument must be a constant String",
+                getName());
+
+        String variant_element_name = name_col->getValue();
+        auto variant_element_type = DataTypeFactory::instance().tryGet(variant_element_name);
+        if (variant_element_type)
+        {
+            const auto & variants = variant_type.getVariants();
+            for (size_t i = 0; i != variants.size(); ++i)
+            {
+                if (variants[i]->getName() == variant_element_type->getName())
+                    return i;
+            }
+        }
+
+        if (argument_size == 2)
+            throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "{} doesn't contain a variant with type {}", variant_type.getName(), variant_element_name);
+        return std::nullopt;
+    }
+
+    ColumnPtr wrapInArraysAndConstIfNeeded(ColumnPtr res, const Columns & array_offsets, bool input_arg_is_const, size_t input_rows_count) const
+    {
+        for (auto it = array_offsets.rbegin(); it != array_offsets.rend(); ++it)
+            res = ColumnArray::create(res, *it);
+
+        if (input_arg_is_const)
+            res = ColumnConst::create(res, input_rows_count);
+
+        return res;
+    }
+};
+
+}
+
+REGISTER_FUNCTION(VariantElement)
+{
+    factory.registerFunction(FunctionDocumentation{
+        .description = R"(
+Extracts a column with the specified type from a `Variant` column.
+)",
+        .syntax{"variantElement(variant, type_name[, default_value])"},
+        .arguments{{
+            {"variant", "Variant column"},
+            {"type_name", "The name of the variant type to extract"},
+            {"default_value", "The default value that will be used if the Variant column doesn't contain a variant with the specified type. Can be any type.
Optional"}}}, + .examples{{{ + "Example", + R"( +CREATE TABLE test (v Variant(UInt64, String, Array(UInt64))) ENGINE = Memory; +INSERT INTO test VALUES (NULL), (42), ('Hello, World!'), ([1, 2, 3]); +SELECT v, variantElement(v, 'String'), variantElement(v, 'UInt64'), variantElement(v, 'Array(UInt64)') FROM test;)", + R"( +┌─v─────────────┬─variantElement(v, 'String')─┬─variantElement(v, 'UInt64')─┬─variantElement(v, 'Array(UInt64)')─┐ +│ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ [] │ +│ 42 │ ᴺᵁᴸᴸ │ 42 │ [] │ +│ Hello, World! │ Hello, World! │ ᴺᵁᴸᴸ │ [] │ +│ [1,2,3] │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ [1,2,3] │ +└───────────────┴─────────────────────────────┴─────────────────────────────┴────────────────────────────────────┘ +)"}}}, + .categories{"Variant"}, + }); +} + +} diff --git a/src/IO/ReadHelpers.cpp b/src/IO/ReadHelpers.cpp index ff5743a63af..2534f248d83 100644 --- a/src/IO/ReadHelpers.cpp +++ b/src/IO/ReadHelpers.cpp @@ -619,13 +619,16 @@ void readQuotedStringInto(Vector & s, ReadBuffer & buf) readAnyQuotedStringInto<'\'', enable_sql_style_quoting>(s, buf); } -template +template bool tryReadQuotedStringInto(Vector & s, ReadBuffer & buf) { - return readAnyQuotedStringInto<'\'', false, Vector, bool>(s, buf); + return readAnyQuotedStringInto<'\'', enable_sql_style_quoting, Vector, bool>(s, buf); } -template bool tryReadQuotedStringInto(String & s, ReadBuffer & buf); +template bool tryReadQuotedStringInto(String & s, ReadBuffer & buf); +template bool tryReadQuotedStringInto(String & s, ReadBuffer & buf); +template bool tryReadQuotedStringInto>(PaddedPODArray & s, ReadBuffer & buf); +template bool tryReadQuotedStringInto>(PaddedPODArray & s, ReadBuffer & buf); template void readDoubleQuotedStringInto(Vector & s, ReadBuffer & buf) @@ -633,6 +636,16 @@ void readDoubleQuotedStringInto(Vector & s, ReadBuffer & buf) readAnyQuotedStringInto<'"', enable_sql_style_quoting>(s, buf); } +template +bool tryReadDoubleQuotedStringInto(Vector & s, ReadBuffer & buf) +{ + return readAnyQuotedStringInto<'"', enable_sql_style_quoting, Vector, bool>(s, buf); +} + +template bool tryReadDoubleQuotedStringInto(String & s, ReadBuffer & buf); +template bool tryReadDoubleQuotedStringInto(String & s, ReadBuffer & buf); + + template void readBackQuotedStringInto(Vector & s, ReadBuffer & buf) { @@ -652,6 +665,18 @@ void readQuotedStringWithSQLStyle(String & s, ReadBuffer & buf) readQuotedStringInto(s, buf); } +bool tryReadQuotedString(String & s, ReadBuffer & buf) +{ + s.clear(); + return tryReadQuotedStringInto(s, buf); +} + +bool tryReadQuotedStringWithSQLStyle(String & s, ReadBuffer & buf) +{ + s.clear(); + return tryReadQuotedStringInto(s, buf); +} + template void readQuotedStringInto(PaddedPODArray & s, ReadBuffer & buf); template void readQuotedStringInto(String & s, ReadBuffer & buf); @@ -672,6 +697,18 @@ void readDoubleQuotedStringWithSQLStyle(String & s, ReadBuffer & buf) readDoubleQuotedStringInto(s, buf); } +bool tryReadDoubleQuotedString(String & s, ReadBuffer & buf) +{ + s.clear(); + return tryReadDoubleQuotedStringInto(s, buf); +} + +bool tryReadDoubleQuotedStringWithSQLStyle(String & s, ReadBuffer & buf) +{ + s.clear(); + return tryReadDoubleQuotedStringInto(s, buf); +} + void readBackQuotedString(String & s, ReadBuffer & buf) { s.clear(); @@ -691,7 +728,7 @@ concept WithResize = requires (T value) { value.size() } -> std::integral<>; }; -template +template void readCSVStringInto(Vector & s, ReadBuffer & buf, const FormatSettings::CSV & settings) { /// Empty string @@ -754,12 +791,20 @@ void readCSVStringInto(Vector & s, ReadBuffer & buf, 
const FormatSettings::CSV & { PeekableReadBuffer * peekable_buf = dynamic_cast(&buf); if (!peekable_buf) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Reading CSV string with custom delimiter is allowed only when using PeekableReadBuffer"); + { + if constexpr (allow_throw) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Reading CSV string with custom delimiter is allowed only when using PeekableReadBuffer"); + return; + } while (true) { if (peekable_buf->eof()) - throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected EOF while reading CSV string, expected custom delimiter \"{}\"", custom_delimiter); + { + if constexpr (allow_throw) + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected EOF while reading CSV string, expected custom delimiter \"{}\"", custom_delimiter); + return; + } char * next_pos = reinterpret_cast(memchr(peekable_buf->position(), custom_delimiter[0], peekable_buf->available())); if (!next_pos) @@ -948,6 +993,9 @@ String readCSVFieldWithTwoPossibleDelimiters(PeekableReadBuffer & buf, const For template void readCSVStringInto>(PaddedPODArray & s, ReadBuffer & buf, const FormatSettings::CSV & settings); template void readCSVStringInto(NullOutput & s, ReadBuffer & buf, const FormatSettings::CSV & settings); +template void readCSVStringInto(String & s, ReadBuffer & buf, const FormatSettings::CSV & settings); +template void readCSVStringInto(String & s, ReadBuffer & buf, const FormatSettings::CSV & settings); +template void readCSVStringInto, false, false>(PaddedPODArray & s, ReadBuffer & buf, const FormatSettings::CSV & settings); template @@ -1069,15 +1117,18 @@ ReturnType readJSONObjectPossiblyInvalid(Vector & s, ReadBuffer & buf) } template void readJSONObjectPossiblyInvalid(String & s, ReadBuffer & buf); +template bool readJSONObjectPossiblyInvalid(String & s, ReadBuffer & buf); template void readJSONObjectPossiblyInvalid>(PaddedPODArray & s, ReadBuffer & buf); +template bool readJSONObjectPossiblyInvalid, bool>(PaddedPODArray & s, ReadBuffer & buf); -template -void readJSONArrayInto(Vector & s, ReadBuffer & buf) +template +ReturnType readJSONArrayInto(Vector & s, ReadBuffer & buf) { - readJSONObjectOrArrayPossiblyInvalid(s, buf); + return readJSONObjectOrArrayPossiblyInvalid(s, buf); } -template void readJSONArrayInto>(PaddedPODArray & s, ReadBuffer & buf); +template void readJSONArrayInto, void>(PaddedPODArray & s, ReadBuffer & buf); +template bool readJSONArrayInto, bool>(PaddedPODArray & s, ReadBuffer & buf); template ReturnType readDateTextFallback(LocalDate & date, ReadBuffer & buf) @@ -1217,6 +1268,13 @@ ReturnType readDateTimeTextFallback(time_t & datetime, ReadBuffer & buf, const D return false; } + if constexpr (!throw_exception) + { + if (!isNumericASCII(s[0]) || !isNumericASCII(s[1]) || !isNumericASCII(s[2]) || !isNumericASCII(s[3]) + || !isNumericASCII(s[5]) || !isNumericASCII(s[6]) || !isNumericASCII(s[8]) || !isNumericASCII(s[9])) + return false; + } + UInt16 year = (s[0] - '0') * 1000 + (s[1] - '0') * 100 + (s[2] - '0') * 10 + (s[3] - '0'); UInt8 month = (s[5] - '0') * 10 + (s[6] - '0'); UInt8 day = (s[8] - '0') * 10 + (s[9] - '0'); @@ -1240,6 +1298,13 @@ ReturnType readDateTimeTextFallback(time_t & datetime, ReadBuffer & buf, const D return false; } + if constexpr (!throw_exception) + { + if (!isNumericASCII(s[0]) || !isNumericASCII(s[1]) || !isNumericASCII(s[3]) || !isNumericASCII(s[4]) + || !isNumericASCII(s[6]) || !isNumericASCII(s[7])) + return false; + } + hour = (s[0] - '0') * 10 + (s[1] - '0'); minute = (s[3] - '0') * 10 + (s[4] - '0'); second = 
(s[6] - '0') * 10 + (s[7] - '0'); @@ -1259,7 +1324,14 @@ ReturnType readDateTimeTextFallback(time_t & datetime, ReadBuffer & buf, const D { /// Not very efficient. for (const char * digit_pos = s; digit_pos < s_pos; ++digit_pos) + { + if constexpr (!throw_exception) + { + if (!isNumericASCII(*digit_pos)) + return false; + } datetime = datetime * 10 + *digit_pos - '0'; + } } datetime *= negative_multiplier; @@ -1282,14 +1354,24 @@ template bool readDateTimeTextFallback(time_t &, ReadBuffer &, cons template bool readDateTimeTextFallback(time_t &, ReadBuffer &, const DateLUTImpl &); -void skipJSONField(ReadBuffer & buf, StringRef name_of_field) +template +ReturnType skipJSONFieldImpl(ReadBuffer & buf, StringRef name_of_field) { + static constexpr bool throw_exception = std::is_same_v; + if (buf.eof()) - throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected EOF for key '{}'", name_of_field.toString()); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected EOF for key '{}'", name_of_field.toString()); + return ReturnType(false); + } else if (*buf.position() == '"') /// skip double-quoted string { NullOutput sink; - readJSONStringInto(sink, buf); + if constexpr (throw_exception) + readJSONStringInto(sink, buf); + else if (!tryReadJSONStringInto(sink, buf)) + return ReturnType(false); } else if (isNumericASCII(*buf.position()) || *buf.position() == '-' || *buf.position() == '+' || *buf.position() == '.') /// skip number { @@ -1298,19 +1380,32 @@ void skipJSONField(ReadBuffer & buf, StringRef name_of_field) double v; if (!tryReadFloatText(v, buf)) - throw Exception(ErrorCodes::INCORRECT_DATA, "Expected a number field for key '{}'", name_of_field.toString()); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::INCORRECT_DATA, "Expected a number field for key '{}'", name_of_field.toString()); + return ReturnType(false); + } } else if (*buf.position() == 'n') /// skip null { - assertString("null", buf); + if constexpr (throw_exception) + assertString("null", buf); + else if (!checkString("null", buf)) + return ReturnType(false); } else if (*buf.position() == 't') /// skip true { - assertString("true", buf); + if constexpr (throw_exception) + assertString("true", buf); + else if (!checkString("true", buf)) + return ReturnType(false); } else if (*buf.position() == 'f') /// skip false { - assertString("false", buf); + if constexpr (throw_exception) + assertString("false", buf); + else if (!checkString("false", buf)) + return ReturnType(false); } else if (*buf.position() == '[') { @@ -1320,12 +1415,16 @@ void skipJSONField(ReadBuffer & buf, StringRef name_of_field) if (!buf.eof() && *buf.position() == ']') /// skip empty array { ++buf.position(); - return; + return ReturnType(true); } while (true) { - skipJSONField(buf, name_of_field); + if constexpr (throw_exception) + skipJSONFieldImpl(buf, name_of_field); + else if (!skipJSONFieldImpl(buf, name_of_field)) + return ReturnType(false); + skipWhitespaceIfAny(buf); if (!buf.eof() && *buf.position() == ',') @@ -1339,7 +1438,11 @@ void skipJSONField(ReadBuffer & buf, StringRef name_of_field) break; } else - throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected symbol for key '{}'", name_of_field.toString()); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected symbol for key '{}'", name_of_field.toString()); + return ReturnType(false); + } } } else if (*buf.position() == '{') /// skip whole object @@ -1353,19 +1456,34 @@ void skipJSONField(ReadBuffer & buf, 
StringRef name_of_field) if (*buf.position() == '"') { NullOutput sink; - readJSONStringInto(sink, buf); + if constexpr (throw_exception) + readJSONStringInto(sink, buf); + else if (!tryReadJSONStringInto(sink, buf)) + return ReturnType(false); } else - throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected symbol for key '{}'", name_of_field.toString()); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected symbol for key '{}'", name_of_field.toString()); + return ReturnType(false); + } // ':' skipWhitespaceIfAny(buf); if (buf.eof() || !(*buf.position() == ':')) - throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected symbol for key '{}'", name_of_field.toString()); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected symbol for key '{}'", name_of_field.toString()); + return ReturnType(false); + } ++buf.position(); skipWhitespaceIfAny(buf); - skipJSONField(buf, name_of_field); + if constexpr (throw_exception) + skipJSONFieldImpl(buf, name_of_field); + else if (!skipJSONFieldImpl(buf, name_of_field)) + return ReturnType(false); + skipWhitespaceIfAny(buf); // optional ',' @@ -1377,14 +1495,32 @@ void skipJSONField(ReadBuffer & buf, StringRef name_of_field) } if (buf.eof()) - throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected EOF for key '{}'", name_of_field.toString()); + { + if constexpr (throw_exception) + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected EOF for key '{}'", name_of_field.toString()); + return ReturnType(false); + } ++buf.position(); } else { - throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected symbol '{}' for key '{}'", - std::string(*buf.position(), 1), name_of_field.toString()); + if constexpr (throw_exception) + throw Exception(ErrorCodes::INCORRECT_DATA, "Unexpected symbol '{}' for key '{}'", + std::string(*buf.position(), 1), name_of_field.toString()); + return ReturnType(false); } + + return ReturnType(true); +} + +void skipJSONField(ReadBuffer & buf, StringRef name_of_field) +{ + skipJSONFieldImpl(buf, name_of_field); +} + +bool trySkipJSONField(ReadBuffer & buf, StringRef name_of_field) +{ + return skipJSONFieldImpl(buf, name_of_field); } @@ -1597,23 +1733,31 @@ void skipToNextRowOrEof(PeekableReadBuffer & buf, const String & row_after_delim } // Use PeekableReadBuffer to copy field to string after parsing. 
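+// In the helpers below, ReturnType is void for the throwing variants and bool for the try-variants,
+// following the same convention as the other read*/tryRead* functions in this file.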
-template -static void readParsedValueInto(Vector & s, ReadBuffer & buf, ParseFunc parse_func) +template +static ReturnType readParsedValueInto(Vector & s, ReadBuffer & buf, ParseFunc parse_func) { PeekableReadBuffer peekable_buf(buf); peekable_buf.setCheckpoint(); - parse_func(peekable_buf); + if constexpr (std::is_same_v) + parse_func(peekable_buf); + else if (!parse_func(peekable_buf)) + return ReturnType(false); peekable_buf.makeContinuousMemoryFromCheckpointToPos(); auto * end = peekable_buf.position(); peekable_buf.rollbackToCheckpoint(); s.append(peekable_buf.position(), end); peekable_buf.position() = end; + return ReturnType(true); } -template -static void readQuotedStringFieldInto(Vector & s, ReadBuffer & buf) +template +static ReturnType readQuotedStringFieldInto(Vector & s, ReadBuffer & buf) { - assertChar('\'', buf); + if constexpr (std::is_same_v) + assertChar('\'', buf); + else if (!checkChar('\'', buf)) + return ReturnType(false); + s.push_back('\''); while (!buf.eof()) { @@ -1641,16 +1785,23 @@ static void readQuotedStringFieldInto(Vector & s, ReadBuffer & buf) } if (buf.eof()) - return; + return ReturnType(false); ++buf.position(); s.push_back('\''); + return ReturnType(true); } -template -static void readQuotedFieldInBracketsInto(Vector & s, ReadBuffer & buf) +template +static ReturnType readQuotedFieldInBracketsInto(Vector & s, ReadBuffer & buf) { - assertChar(opening_bracket, buf); + static constexpr bool throw_exception = std::is_same_v; + + if constexpr (throw_exception) + assertChar(opening_bracket, buf); + else if (!checkChar(opening_bracket, buf)) + return ReturnType(false); + s.push_back(opening_bracket); size_t balance = 1; @@ -1666,7 +1817,10 @@ static void readQuotedFieldInBracketsInto(Vector & s, ReadBuffer & buf) if (*buf.position() == '\'') { - readQuotedStringFieldInto(s, buf); + if constexpr (throw_exception) + readQuotedStringFieldInto(s, buf); + else if (!readQuotedStringFieldInto(s, buf)) + return ReturnType(false); } else if (*buf.position() == opening_bracket) { @@ -1681,13 +1835,20 @@ static void readQuotedFieldInBracketsInto(Vector & s, ReadBuffer & buf) ++buf.position(); } } + + if (balance) + return ReturnType(false); + + return ReturnType(true); } -template -void readQuotedFieldInto(Vector & s, ReadBuffer & buf) +template +ReturnType readQuotedFieldInto(Vector & s, ReadBuffer & buf) { + static constexpr bool throw_exception = std::is_same_v; + if (buf.eof()) - return; + return ReturnType(false); /// Possible values in 'Quoted' field: /// - Strings: '...' @@ -1699,35 +1860,47 @@ void readQuotedFieldInto(Vector & s, ReadBuffer & buf) /// - Number: integer, float, decimal. 
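+    /// In the try-variant (ReturnType == bool) any mismatch below returns false instead of throwing.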
if (*buf.position() == '\'') - readQuotedStringFieldInto(s, buf); + return readQuotedStringFieldInto(s, buf); else if (*buf.position() == '[') - readQuotedFieldInBracketsInto<'[', ']'>(s, buf); + return readQuotedFieldInBracketsInto(s, buf); else if (*buf.position() == '(') - readQuotedFieldInBracketsInto<'(', ')'>(s, buf); + return readQuotedFieldInBracketsInto(s, buf); else if (*buf.position() == '{') - readQuotedFieldInBracketsInto<'{', '}'>(s, buf); + return readQuotedFieldInBracketsInto(s, buf); else if (checkCharCaseInsensitive('n', buf)) { /// NULL or NaN if (checkCharCaseInsensitive('u', buf)) { - assertStringCaseInsensitive("ll", buf); + if constexpr (throw_exception) + assertStringCaseInsensitive("ll", buf); + else if (!checkStringCaseInsensitive("ll", buf)) + return ReturnType(false); s.append("NULL"); } else { - assertStringCaseInsensitive("an", buf); + if constexpr (throw_exception) + assertStringCaseInsensitive("an", buf); + else if (!checkStringCaseInsensitive("an", buf)) + return ReturnType(false); s.append("NaN"); } } else if (checkCharCaseInsensitive('t', buf)) { - assertStringCaseInsensitive("rue", buf); + if constexpr (throw_exception) + assertStringCaseInsensitive("rue", buf); + else if (!checkStringCaseInsensitive("rue", buf)) + return ReturnType(false); s.append("true"); } else if (checkCharCaseInsensitive('f', buf)) { - assertStringCaseInsensitive("alse", buf); + if constexpr (throw_exception) + assertStringCaseInsensitive("alse", buf); + else if (!checkStringCaseInsensitive("alse", buf)) + return ReturnType(false); s.append("false"); } else @@ -1736,13 +1909,19 @@ void readQuotedFieldInto(Vector & s, ReadBuffer & buf) auto parse_func = [](ReadBuffer & in) { Float64 tmp; - readFloatText(tmp, in); + if constexpr (throw_exception) + readFloatText(tmp, in); + else + return tryReadFloatText(tmp, in); }; - readParsedValueInto(s, buf, parse_func); + + return readParsedValueInto(s, buf, parse_func); } + + return ReturnType(true); } -template void readQuotedFieldInto(NullOutput & s, ReadBuffer & buf); +template void readQuotedFieldInto(NullOutput & s, ReadBuffer & buf); void readQuotedField(String & s, ReadBuffer & buf) { @@ -1750,11 +1929,24 @@ void readQuotedField(String & s, ReadBuffer & buf) readQuotedFieldInto(s, buf); } +bool tryReadQuotedField(String & s, ReadBuffer & buf) +{ + s.clear(); + return readQuotedFieldInto(s, buf); +} + void readJSONField(String & s, ReadBuffer & buf) { s.clear(); auto parse_func = [](ReadBuffer & in) { skipJSONField(in, "json_field"); }; - readParsedValueInto(s, buf, parse_func); + readParsedValueInto(s, buf, parse_func); +} + +bool tryReadJSONField(String & s, ReadBuffer & buf) +{ + s.clear(); + auto parse_func = [](ReadBuffer & in) { return trySkipJSONField(in, "json_field"); }; + return readParsedValueInto(s, buf, parse_func); } void readTSVField(String & s, ReadBuffer & buf) diff --git a/src/IO/ReadHelpers.h b/src/IO/ReadHelpers.h index 17f3d3d4151..ad62a3deaca 100644 --- a/src/IO/ReadHelpers.h +++ b/src/IO/ReadHelpers.h @@ -257,26 +257,43 @@ inline void readBoolText(bool & x, ReadBuffer & buf) x = tmp != '0'; } -inline void readBoolTextWord(bool & x, ReadBuffer & buf, bool support_upper_case = false) +template +inline ReturnType readBoolTextWord(bool & x, ReadBuffer & buf, bool support_upper_case = false) { + static constexpr bool throw_exception = std::is_same_v; + if (buf.eof()) [[unlikely]] - throwReadAfterEOF(); + { + if constexpr (throw_exception) + throwReadAfterEOF(); + else + return ReturnType(false); + } switch 
(*buf.position()) { case 't': - assertString("true", buf); + if constexpr (throw_exception) + assertString("true", buf); + else if (!checkString("true", buf)) + return ReturnType(false); x = true; break; case 'f': - assertString("false", buf); + if constexpr (throw_exception) + assertString("false", buf); + else if (!checkString("false", buf)) + return ReturnType(false); x = false; break; case 'T': { if (support_upper_case) { - assertString("TRUE", buf); + if constexpr (throw_exception) + assertString("TRUE", buf); + else if (!checkString("TRUE", buf)) + return ReturnType(false); x = true; break; } @@ -287,7 +304,10 @@ inline void readBoolTextWord(bool & x, ReadBuffer & buf, bool support_upper_case { if (support_upper_case) { - assertString("FALSE", buf); + if constexpr (throw_exception) + assertString("FALSE", buf); + else if (!checkString("FALSE", buf)) + return ReturnType(false); x = false; break; } @@ -295,8 +315,15 @@ inline void readBoolTextWord(bool & x, ReadBuffer & buf, bool support_upper_case [[fallthrough]]; } default: - throw ParsingException(ErrorCodes::CANNOT_PARSE_BOOL, "Unexpected Bool value"); + { + if constexpr (throw_exception) + throw ParsingException(ErrorCodes::CANNOT_PARSE_BOOL, "Unexpected Bool value"); + else + return ReturnType(false); + } } + + return ReturnType(true); } enum class ReadIntTextCheckOverflow @@ -468,7 +495,10 @@ void readIntText(T & x, ReadBuffer & buf) template bool tryReadIntText(T & x, ReadBuffer & buf) { - return readIntTextImpl(x, buf); + if constexpr (is_decimal) + return tryReadIntText(x.value, buf); + else + return readIntTextImpl(x, buf); } @@ -477,16 +507,18 @@ bool tryReadIntText(T & x, ReadBuffer & buf) * - for numbers starting with zero, parsed only zero; * - symbol '+' before number is not supported; */ -template -void readIntTextUnsafe(T & x, ReadBuffer & buf) +template +ReturnType readIntTextUnsafe(T & x, ReadBuffer & buf) { + static constexpr bool throw_exception = std::is_same_v; bool negative = false; make_unsigned_t res = 0; auto on_error = [] { - if (throw_on_error) + if constexpr (throw_exception) throwReadAfterEOF(); + return ReturnType(false); }; if (buf.eof()) [[unlikely]] @@ -504,7 +536,7 @@ void readIntTextUnsafe(T & x, ReadBuffer & buf) { ++buf.position(); x = 0; - return; + return ReturnType(true); } while (!buf.eof()) @@ -523,12 +555,13 @@ void readIntTextUnsafe(T & x, ReadBuffer & buf) /// See note about undefined behaviour above. x = is_signed_v && negative ? 
-res : res; + return ReturnType(true); } template -void tryReadIntTextUnsafe(T & x, ReadBuffer & buf) +bool tryReadIntTextUnsafe(T & x, ReadBuffer & buf) { - return readIntTextUnsafe(x, buf); + return readIntTextUnsafe(x, buf); } @@ -550,9 +583,15 @@ void readEscapedString(String & s, ReadBuffer & buf); void readQuotedString(String & s, ReadBuffer & buf); void readQuotedStringWithSQLStyle(String & s, ReadBuffer & buf); +bool tryReadQuotedString(String & s, ReadBuffer & buf); +bool tryReadQuotedStringWithSQLStyle(String & s, ReadBuffer & buf); + void readDoubleQuotedString(String & s, ReadBuffer & buf); void readDoubleQuotedStringWithSQLStyle(String & s, ReadBuffer & buf); +bool tryReadDoubleQuotedString(String & s, ReadBuffer & buf); +bool tryReadDoubleQuotedStringWithSQLStyle(String & s, ReadBuffer & buf); + void readJSONString(String & s, ReadBuffer & buf); void readBackQuotedString(String & s, ReadBuffer & buf); @@ -615,7 +654,7 @@ void readBackQuotedStringInto(Vector & s, ReadBuffer & buf); template void readStringUntilEOFInto(Vector & s, ReadBuffer & buf); -template +template void readCSVStringInto(Vector & s, ReadBuffer & buf, const FormatSettings::CSV & settings); /// ReturnType is either bool or void. If bool, the function will return false instead of throwing an exception. @@ -628,7 +667,7 @@ bool tryReadJSONStringInto(Vector & s, ReadBuffer & buf) return readJSONStringInto(s, buf); } -template +template bool tryReadQuotedStringInto(Vector & s, ReadBuffer & buf); /// Reads chunk of data between {} in that way, @@ -637,8 +676,8 @@ bool tryReadQuotedStringInto(Vector & s, ReadBuffer & buf); template ReturnType readJSONObjectPossiblyInvalid(Vector & s, ReadBuffer & buf); -template -void readJSONArrayInto(Vector & s, ReadBuffer & buf); +template +ReturnType readJSONArrayInto(Vector & s, ReadBuffer & buf); template void readStringUntilWhitespaceInto(Vector & s, ReadBuffer & buf); @@ -962,6 +1001,13 @@ inline ReturnType readDateTimeTextImpl(time_t & datetime, ReadBuffer & buf, cons { if (s[4] < '0' || s[4] > '9') { + if constexpr (!throw_exception) + { + if (!isNumericASCII(s[0]) || !isNumericASCII(s[1]) || !isNumericASCII(s[2]) || !isNumericASCII(s[3]) + || !isNumericASCII(s[5]) || !isNumericASCII(s[6]) || !isNumericASCII(s[8]) || !isNumericASCII(s[9])) + return ReturnType(false); + } + UInt16 year = (s[0] - '0') * 1000 + (s[1] - '0') * 100 + (s[2] - '0') * 10 + (s[3] - '0'); UInt8 month = (s[5] - '0') * 10 + (s[6] - '0'); UInt8 day = (s[8] - '0') * 10 + (s[9] - '0'); @@ -974,6 +1020,13 @@ inline ReturnType readDateTimeTextImpl(time_t & datetime, ReadBuffer & buf, cons bool dt_long = (s[10] == ' ' || s[10] == 'T'); if (dt_long) { + if constexpr (!throw_exception) + { + if (!isNumericASCII(s[11]) || !isNumericASCII(s[12]) || !isNumericASCII(s[14]) || !isNumericASCII(s[15]) + || !isNumericASCII(s[17]) || !isNumericASCII(s[18])) + return ReturnType(false); + } + hour = (s[11] - '0') * 10 + (s[12] - '0'); minute = (s[14] - '0') * 10 + (s[15] - '0'); second = (s[17] - '0') * 10 + (s[18] - '0'); @@ -1311,6 +1364,11 @@ inline bool tryReadText(is_integer auto & x, ReadBuffer & buf) return tryReadIntText(x, buf); } +inline bool tryReadText(is_floating_point auto & x, ReadBuffer & buf) +{ + return tryReadFloatText(x, buf); +} + inline bool tryReadText(UUID & x, ReadBuffer & buf) { return tryReadUUIDText(x, buf); } inline bool tryReadText(IPv4 & x, ReadBuffer & buf) { return tryReadIPv4Text(x, buf); } inline bool tryReadText(IPv6 & x, ReadBuffer & buf) { return tryReadIPv6Text(x, buf); } @@ 
-1320,9 +1378,20 @@ inline void readText(is_floating_point auto & x, ReadBuffer & buf) { readFloatTe inline void readText(String & x, ReadBuffer & buf) { readEscapedString(x, buf); } inline void readText(DayNum & x, ReadBuffer & buf, const DateLUTImpl & time_zone = DateLUT::instance()) { readDateText(x, buf, time_zone); } +inline bool tryReadText(DayNum & x, ReadBuffer & buf, const DateLUTImpl & time_zone = DateLUT::instance()) { return tryReadDateText(x, buf, time_zone); } inline void readText(LocalDate & x, ReadBuffer & buf) { readDateText(x, buf); } +inline bool tryReadText(LocalDate & x, ReadBuffer & buf) { return tryReadDateText(x, buf); } inline void readText(LocalDateTime & x, ReadBuffer & buf) { readDateTimeText(x, buf); } +inline bool tryReadText(LocalDateTime & x, ReadBuffer & buf) +{ + time_t time; + if (!tryReadDateTimeText(time, buf)) + return false; + x = LocalDateTime(time, DateLUT::instance()); + return true; +} + inline void readText(UUID & x, ReadBuffer & buf) { readUUIDText(x, buf); } inline void readText(IPv4 & x, ReadBuffer & buf) { readIPv4Text(x, buf); } inline void readText(IPv6 & x, ReadBuffer & buf) { readIPv6Text(x, buf); } @@ -1400,39 +1469,71 @@ inline void readDoubleQuoted(LocalDateTime & x, ReadBuffer & buf) } /// CSV for numbers: quotes are optional, no special escaping rules. -template -inline void readCSVSimple(T & x, ReadBuffer & buf) +template +inline ReturnType readCSVSimple(T & x, ReadBuffer & buf) { + static constexpr bool throw_exception = std::is_same_v; + if (buf.eof()) [[unlikely]] - throwReadAfterEOF(); + { + if constexpr (throw_exception) + throwReadAfterEOF(); + return ReturnType(false); + } char maybe_quote = *buf.position(); if (maybe_quote == '\'' || maybe_quote == '\"') ++buf.position(); - readText(x, buf); + if constexpr (throw_exception) + readText(x, buf); + else if (!tryReadText(x, buf)) + return ReturnType(false); if (maybe_quote == '\'' || maybe_quote == '\"') - assertChar(maybe_quote, buf); + { + if constexpr (throw_exception) + assertChar(maybe_quote, buf); + else if (!checkChar(maybe_quote, buf)) + return ReturnType(false); + } + + return ReturnType(true); } // standalone overload for dates: to avoid instantiating DateLUTs while parsing other types -template -inline void readCSVSimple(T & x, ReadBuffer & buf, const DateLUTImpl & time_zone) +template +inline ReturnType readCSVSimple(T & x, ReadBuffer & buf, const DateLUTImpl & time_zone) { + static constexpr bool throw_exception = std::is_same_v; + if (buf.eof()) [[unlikely]] - throwReadAfterEOF(); + { + if constexpr (throw_exception) + throwReadAfterEOF(); + return ReturnType(false); + } char maybe_quote = *buf.position(); if (maybe_quote == '\'' || maybe_quote == '\"') ++buf.position(); - readText(x, buf, time_zone); + if constexpr (throw_exception) + readText(x, buf, time_zone); + else if (!tryReadText(x, buf, time_zone)) + return ReturnType(false); if (maybe_quote == '\'' || maybe_quote == '\"') - assertChar(maybe_quote, buf); + { + if constexpr (throw_exception) + assertChar(maybe_quote, buf); + else if (!checkChar(maybe_quote, buf)) + return ReturnType(false); + } + + return ReturnType(true); } template @@ -1442,18 +1543,52 @@ inline void readCSV(T & x, ReadBuffer & buf) readCSVSimple(x, buf); } +template +requires is_arithmetic_v +inline bool tryReadCSV(T & x, ReadBuffer & buf) +{ + return readCSVSimple(x, buf); +} + inline void readCSV(String & x, ReadBuffer & buf, const FormatSettings::CSV & settings) { readCSVString(x, buf, settings); } +inline bool tryReadCSV(String & x, 
ReadBuffer & buf, const FormatSettings::CSV & settings) +{ + x.clear(); + readCSVStringInto(x, buf, settings); + return true; +} + inline void readCSV(LocalDate & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(LocalDate & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } + inline void readCSV(DayNum & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(DayNum & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } inline void readCSV(DayNum & x, ReadBuffer & buf, const DateLUTImpl & time_zone) { readCSVSimple(x, buf, time_zone); } +inline bool tryReadCSV(DayNum & x, ReadBuffer & buf, const DateLUTImpl & time_zone) { return readCSVSimple(x, buf, time_zone); } + inline void readCSV(LocalDateTime & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(LocalDateTime & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } + inline void readCSV(UUID & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(UUID & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } + inline void readCSV(IPv4 & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(IPv4 & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } + inline void readCSV(IPv6 & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(IPv6 & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } + inline void readCSV(UInt128 & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(UInt128 & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } + inline void readCSV(Int128 & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(Int128 & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } + inline void readCSV(UInt256 & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(UInt256 & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } + inline void readCSV(Int256 & x, ReadBuffer & buf) { readCSVSimple(x, buf); } +inline bool tryReadCSV(Int256 & x, ReadBuffer & buf) { return readCSVSimple(x, buf); } template void readBinary(std::vector & x, ReadBuffer & buf) @@ -1535,6 +1670,7 @@ inline void skipWhitespaceIfAny(ReadBuffer & buf, bool one_line = false) /// Skips json value. void skipJSONField(ReadBuffer & buf, StringRef name_of_field); +bool trySkipJSONField(ReadBuffer & buf, StringRef name_of_field); /** Read serialized exception. 
@@ -1749,12 +1885,14 @@ struct PcgDeserializer
 }
 };
 
-template
-void readQuotedFieldInto(Vector & s, ReadBuffer & buf);
+template
+ReturnType readQuotedFieldInto(Vector & s, ReadBuffer & buf);
 
 void readQuotedField(String & s, ReadBuffer & buf);
+bool tryReadQuotedField(String & s, ReadBuffer & buf);
 
 void readJSONField(String & s, ReadBuffer & buf);
+bool tryReadJSONField(String & s, ReadBuffer & buf);
 
 void readTSVField(String & s, ReadBuffer & buf);
diff --git a/src/IO/readDecimalText.h b/src/IO/readDecimalText.h
index 9fd9c439b87..81bde87f1f1 100644
--- a/src/IO/readDecimalText.h
+++ b/src/IO/readDecimalText.h
@@ -224,4 +224,24 @@ inline void readCSVDecimalText(ReadBuffer & buf, T & x, uint32_t precision, uint
     assertChar(maybe_quote, buf);
 }
 
+template
+inline bool tryReadCSVDecimalText(ReadBuffer & buf, T & x, uint32_t precision, uint32_t & scale)
+{
+    if (buf.eof())
+        return false;
+
+    char maybe_quote = *buf.position();
+
+    if (maybe_quote == '\'' || maybe_quote == '\"')
+        ++buf.position();
+
+    if (!tryReadDecimalText(buf, x, precision, scale))
+        return false;
+
+    if ((maybe_quote == '\'' || maybe_quote == '\"') && !checkChar(maybe_quote, buf))
+        return false;
+
+    return true;
+}
+
 }
diff --git a/src/Interpreters/InterpreterCreateQuery.cpp b/src/Interpreters/InterpreterCreateQuery.cpp
index bf07f4ed3ee..51f767afc04 100644
--- a/src/Interpreters/InterpreterCreateQuery.cpp
+++ b/src/Interpreters/InterpreterCreateQuery.cpp
@@ -939,6 +939,20 @@ void InterpreterCreateQuery::validateTableStructure(const ASTCreateQuery & creat
             }
         }
     }
+    if (!create.attach && !settings.allow_experimental_variant_type)
+    {
+        for (const auto & [name, type] : properties.columns.getAllPhysical())
+        {
+            if (isVariant(type))
+            {
+                throw Exception(ErrorCodes::ILLEGAL_COLUMN,
+                    "Cannot create table with column '{}' whose type is '{}' "
+                    "because experimental Variant type is not allowed. "
+                    "Set setting allow_experimental_variant_type = 1 in order to allow it",
+                    name, type->getName());
+            }
+        }
+    }
 }
 
 namespace
diff --git a/src/Interpreters/InterpreterInsertQuery.cpp b/src/Interpreters/InterpreterInsertQuery.cpp
index 283289f0dfc..32b24cba940 100644
--- a/src/Interpreters/InterpreterInsertQuery.cpp
+++ b/src/Interpreters/InterpreterInsertQuery.cpp
@@ -532,7 +532,7 @@ BlockIO InterpreterInsertQuery::execute()
 {
     /// Change query sample block columns to Nullable to allow inserting nullable columns, where NULL values will be substituted with
     /// default column values (in AddingDefaultsTransform), so all values will be cast correctly.
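+    /// Variant target columns are skipped here: a Variant column can store NULL rows natively, so it does not need a Nullable wrapper for default substitution.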
- if (isNullableOrLowCardinalityNullable(input_columns[col_idx].type) && !isNullableOrLowCardinalityNullable(query_columns[col_idx].type) && output_columns.has(query_columns[col_idx].name)) + if (isNullableOrLowCardinalityNullable(input_columns[col_idx].type) && !isNullableOrLowCardinalityNullable(query_columns[col_idx].type) && !isVariant(query_columns[col_idx].type) && output_columns.has(query_columns[col_idx].name)) query_sample_block.setColumn(col_idx, ColumnWithTypeAndName(makeNullableOrLowCardinalityNullable(query_columns[col_idx].column), makeNullableOrLowCardinalityNullable(query_columns[col_idx].type), query_columns[col_idx].name)); } } diff --git a/src/Interpreters/inplaceBlockConversions.cpp b/src/Interpreters/inplaceBlockConversions.cpp index c7a1cab8bac..fd8f5b154c4 100644 --- a/src/Interpreters/inplaceBlockConversions.cpp +++ b/src/Interpreters/inplaceBlockConversions.cpp @@ -237,17 +237,36 @@ static std::unordered_map collectOffsetsColumns( { auto & offsets_column = offsets_columns[stream_name]; if (!offsets_column) + { offsets_column = current_offsets_column; + } + else + { + /// If we are inside Variant element, it may happen that + /// offsets are different, because when we read Variant + /// element as a subcolumn, we expand this column according + /// to the discriminators, so, offsets column can be changed. + /// In this case we should select the original offsets column + /// of this stream, which is the smallest one. + bool inside_variant_element = false; + for (const auto & elem : subpath) + inside_variant_element |= elem.type == ISerialization::Substream::VariantElement; - #ifndef NDEBUG - const auto & offsets_data = assert_cast(*offsets_column).getData(); - const auto & current_offsets_data = assert_cast(*current_offsets_column).getData(); + if (offsets_column->size() != current_offsets_column->size() && inside_variant_element) + offsets_column = offsets_column->size() < current_offsets_column->size() ? offsets_column : current_offsets_column; +#ifndef NDEBUG + else + { + const auto & offsets_data = assert_cast(*offsets_column).getData(); + const auto & current_offsets_data = assert_cast(*current_offsets_column).getData(); - if (offsets_data != current_offsets_data) - throw Exception(ErrorCodes::LOGICAL_ERROR, - "Found non-equal columns with offsets (sizes: {} and {}) for stream {}", - offsets_data.size(), current_offsets_data.size(), stream_name); - #endif + if (offsets_data != current_offsets_data) + throw Exception(ErrorCodes::LOGICAL_ERROR, + "Found non-equal columns with offsets (sizes: {} and {}) for stream {}", + offsets_data.size(), current_offsets_data.size(), stream_name); + } +#endif + } } }, available_column->type, res_columns[i]); } diff --git a/src/Interpreters/parseColumnsListForTableFunction.cpp b/src/Interpreters/parseColumnsListForTableFunction.cpp index 87f76f7f824..551a883d093 100644 --- a/src/Interpreters/parseColumnsListForTableFunction.cpp +++ b/src/Interpreters/parseColumnsListForTableFunction.cpp @@ -60,6 +60,17 @@ void validateDataType(const DataTypePtr & type, const DataTypeValidationSettings MAX_FIXEDSTRING_SIZE_WITHOUT_SUSPICIOUS); } } + + if (!settings.allow_experimental_variant_type) + { + if (isVariant(type)) + { + throw Exception( + ErrorCodes::ILLEGAL_COLUMN, + "Cannot create column with type '{}' because experimental Variant type is not allowed. 
" + "Set setting allow_experimental_variant_type = 1 in order to allow it", type->getName()); + } + } } ColumnsDescription parseColumnsListFromString(const std::string & structure, const ContextPtr & context) diff --git a/src/Interpreters/parseColumnsListForTableFunction.h b/src/Interpreters/parseColumnsListForTableFunction.h index ef1bbe5498e..1fbbfa4b12f 100644 --- a/src/Interpreters/parseColumnsListForTableFunction.h +++ b/src/Interpreters/parseColumnsListForTableFunction.h @@ -18,12 +18,14 @@ struct DataTypeValidationSettings : allow_suspicious_low_cardinality_types(settings.allow_suspicious_low_cardinality_types) , allow_experimental_object_type(settings.allow_experimental_object_type) , allow_suspicious_fixed_string_types(settings.allow_suspicious_fixed_string_types) + , allow_experimental_variant_type(settings.allow_experimental_variant_type) { } bool allow_suspicious_low_cardinality_types = true; bool allow_experimental_object_type = true; bool allow_suspicious_fixed_string_types = true; + bool allow_experimental_variant_type = true; }; void validateDataType(const DataTypePtr & type, const DataTypeValidationSettings & settings); diff --git a/src/Parsers/ExpressionElementParsers.cpp b/src/Parsers/ExpressionElementParsers.cpp index 594221fe050..5dc791f7003 100644 --- a/src/Parsers/ExpressionElementParsers.cpp +++ b/src/Parsers/ExpressionElementParsers.cpp @@ -250,7 +250,7 @@ bool ParserTableAsStringLiteralIdentifier::parseImpl(Pos & pos, ASTPtr & node, E ReadBufferFromMemory in(pos->begin, pos->size()); String s; - if (!tryReadQuotedStringInto(s, in)) + if (!tryReadQuotedString(s, in)) { expected.add(pos, "string literal"); return false; diff --git a/src/Processors/Formats/Impl/CSVRowInputFormat.cpp b/src/Processors/Formats/Impl/CSVRowInputFormat.cpp index 5e12ec18d27..cab0f7523f1 100644 --- a/src/Processors/Formats/Impl/CSVRowInputFormat.cpp +++ b/src/Processors/Formats/Impl/CSVRowInputFormat.cpp @@ -391,7 +391,7 @@ bool CSVFormatReader::readFieldImpl(ReadBuffer & istr, DB::IColumn & column, con if (format_settings.null_as_default && !isNullableOrLowCardinalityNullable(type)) { /// If value is null but type is not nullable then use default value instead. - return SerializationNullable::deserializeTextCSVImpl(column, istr, format_settings, serialization); + return SerializationNullable::deserializeNullAsDefaultOrNestedTextCSV(column, istr, format_settings, serialization); } /// Read the column normally. 
diff --git a/src/Processors/Formats/Impl/MySQLDumpRowInputFormat.cpp b/src/Processors/Formats/Impl/MySQLDumpRowInputFormat.cpp index 7e8b4accf4d..9c7f095e661 100644 --- a/src/Processors/Formats/Impl/MySQLDumpRowInputFormat.cpp +++ b/src/Processors/Formats/Impl/MySQLDumpRowInputFormat.cpp @@ -409,7 +409,7 @@ bool MySQLDumpRowInputFormat::readField(IColumn & column, size_t column_idx) const auto & type = types[column_idx]; const auto & serialization = serializations[column_idx]; if (format_settings.null_as_default && !isNullableOrLowCardinalityNullable(type)) - return SerializationNullable::deserializeTextQuotedImpl(column, *in, format_settings, serialization); + return SerializationNullable::deserializeNullAsDefaultOrNestedTextQuoted(column, *in, format_settings, serialization); serialization->deserializeTextQuoted(column, *in, format_settings); return true; diff --git a/src/Processors/Formats/Impl/TSKVRowInputFormat.cpp b/src/Processors/Formats/Impl/TSKVRowInputFormat.cpp index f4f92583473..0f68c28ab1f 100644 --- a/src/Processors/Formats/Impl/TSKVRowInputFormat.cpp +++ b/src/Processors/Formats/Impl/TSKVRowInputFormat.cpp @@ -147,7 +147,7 @@ bool TSKVRowInputFormat::readRow(MutableColumns & columns, RowReadExtension & ex const auto & type = getPort().getHeader().getByPosition(index).type; const auto & serialization = serializations[index]; if (format_settings.null_as_default && !isNullableOrLowCardinalityNullable(type)) - read_columns[index] = SerializationNullable::deserializeTextEscapedImpl(*columns[index], *in, format_settings, serialization); + read_columns[index] = SerializationNullable::deserializeNullAsDefaultOrNestedTextEscaped(*columns[index], *in, format_settings, serialization); else serialization->deserializeTextEscaped(*columns[index], *in, format_settings); } diff --git a/src/Processors/Formats/Impl/TabSeparatedRowInputFormat.cpp b/src/Processors/Formats/Impl/TabSeparatedRowInputFormat.cpp index 3205adc2a48..88eb11d130d 100644 --- a/src/Processors/Formats/Impl/TabSeparatedRowInputFormat.cpp +++ b/src/Processors/Formats/Impl/TabSeparatedRowInputFormat.cpp @@ -167,7 +167,7 @@ bool TabSeparatedFormatReader::readField(IColumn & column, const DataTypePtr & t if (is_raw) { if (as_nullable) - return SerializationNullable::deserializeTextRawImpl(column, *buf, format_settings, serialization); + return SerializationNullable::deserializeNullAsDefaultOrNestedTextRaw(column, *buf, format_settings, serialization); serialization->deserializeTextRaw(column, *buf, format_settings); return true; @@ -175,7 +175,7 @@ bool TabSeparatedFormatReader::readField(IColumn & column, const DataTypePtr & t if (as_nullable) - return SerializationNullable::deserializeTextEscapedImpl(column, *buf, format_settings, serialization); + return SerializationNullable::deserializeNullAsDefaultOrNestedTextEscaped(column, *buf, format_settings, serialization); serialization->deserializeTextEscaped(column, *buf, format_settings); return true; diff --git a/src/Processors/Formats/Impl/ValuesBlockInputFormat.cpp b/src/Processors/Formats/Impl/ValuesBlockInputFormat.cpp index d55ccce8879..a7b5795b89e 100644 --- a/src/Processors/Formats/Impl/ValuesBlockInputFormat.cpp +++ b/src/Processors/Formats/Impl/ValuesBlockInputFormat.cpp @@ -293,7 +293,7 @@ bool ValuesBlockInputFormat::tryReadValue(IColumn & column, size_t column_idx) const auto & type = types[column_idx]; const auto & serialization = serializations[column_idx]; if (format_settings.null_as_default && !isNullableOrLowCardinalityNullable(type)) - read = 
SerializationNullable::deserializeTextQuotedImpl(column, *buf, format_settings, serialization); + read = SerializationNullable::deserializeNullAsDefaultOrNestedTextQuoted(column, *buf, format_settings, serialization); else serialization->deserializeTextQuoted(column, *buf, format_settings); } diff --git a/tests/queries/0_stateless/02940_variant_text_deserialization.reference b/tests/queries/0_stateless/02940_variant_text_deserialization.reference new file mode 100644 index 00000000000..98725917567 --- /dev/null +++ b/tests/queries/0_stateless/02940_variant_text_deserialization.reference @@ -0,0 +1,516 @@ +JSON +String +{"v":null,"variantElement(v, 'String')":null} +{"v":"string","variantElement(v, 'String')":"string"} +{"v":"42","variantElement(v, 'String')":null} +FixedString +{"v":null,"variantElement(v, 'FixedString(4)')":null} +{"v":"string","variantElement(v, 'FixedString(4)')":null} +{"v":"abcd","variantElement(v, 'FixedString(4)')":"abcd"} +Bool +{"v":null,"variantElement(v, 'Bool')":null} +{"v":"string","variantElement(v, 'Bool')":null} +{"v":true,"variantElement(v, 'Bool')":true} +Integers +{"v":null,"variantElement(v, 'Int8')":null} +{"v":"string","variantElement(v, 'Int8')":null} +{"v":-1,"variantElement(v, 'Int8')":-1} +{"v":0,"variantElement(v, 'Int8')":0} +{"v":"10000000000","variantElement(v, 'Int8')":null} +{"v":null,"variantElement(v, 'UInt8')":null} +{"v":"string","variantElement(v, 'UInt8')":null} +{"v":"-1","variantElement(v, 'UInt8')":null} +{"v":0,"variantElement(v, 'UInt8')":0} +{"v":"10000000000","variantElement(v, 'UInt8')":null} +{"v":null,"variantElement(v, 'Int16')":null} +{"v":"string","variantElement(v, 'Int16')":null} +{"v":-1,"variantElement(v, 'Int16')":-1} +{"v":0,"variantElement(v, 'Int16')":0} +{"v":"10000000000","variantElement(v, 'Int16')":null} +{"v":null,"variantElement(v, 'UInt16')":null} +{"v":"string","variantElement(v, 'UInt16')":null} +{"v":"-1","variantElement(v, 'UInt16')":null} +{"v":0,"variantElement(v, 'UInt16')":0} +{"v":"10000000000","variantElement(v, 'UInt16')":null} +{"v":null,"variantElement(v, 'Int32')":null} +{"v":"string","variantElement(v, 'Int32')":null} +{"v":-1,"variantElement(v, 'Int32')":-1} +{"v":0,"variantElement(v, 'Int32')":0} +{"v":"10000000000","variantElement(v, 'Int32')":null} +{"v":null,"variantElement(v, 'UInt32')":null} +{"v":"string","variantElement(v, 'UInt32')":null} +{"v":"-1","variantElement(v, 'UInt32')":null} +{"v":0,"variantElement(v, 'UInt32')":0} +{"v":"10000000000","variantElement(v, 'UInt32')":null} +{"v":null,"variantElement(v, 'Int64')":null} +{"v":"string","variantElement(v, 'Int64')":null} +{"v":"-1","variantElement(v, 'Int64')":"-1"} +{"v":"0","variantElement(v, 'Int64')":"0"} +{"v":"10000000000000000000000","variantElement(v, 'Int64')":null} +{"v":null,"variantElement(v, 'UInt64')":null} +{"v":"string","variantElement(v, 'UInt64')":null} +{"v":"-1","variantElement(v, 'UInt64')":null} +{"v":"0","variantElement(v, 'UInt64')":"0"} +{"v":"10000000000000000000000","variantElement(v, 'UInt64')":null} +{"v":null,"variantElement(v, 'Int128')":null} +{"v":"string","variantElement(v, 'Int128')":null} +{"v":"-1","variantElement(v, 'Int128')":"-1"} +{"v":"0","variantElement(v, 'Int128')":"0"} +{"v":null,"variantElement(v, 'UInt128')":null} +{"v":"string","variantElement(v, 'UInt128')":null} +{"v":"-1","variantElement(v, 'UInt128')":null} +{"v":"0","variantElement(v, 'UInt128')":"0"} +Floats +{"v":null,"variantElement(v, 'Float32')":null} +{"v":"string","variantElement(v, 'Float32')":null} 
+{"v":42.42,"variantElement(v, 'Float32')":42.42} +{"v":null,"variantElement(v, 'Float64')":null} +{"v":"string","variantElement(v, 'Float64')":null} +{"v":42.42,"variantElement(v, 'Float64')":42.42} +Decimals +{"v":null,"variantElement(v, 'Decimal32(6)')":null} +{"v":"string","variantElement(v, 'Decimal32(6)')":null} +{"v":42.42,"variantElement(v, 'Decimal32(6)')":42.42} +{"v":"4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242","variantElement(v, 'Decimal32(6)')":null} +{"v":null,"variantElement(v, 'Decimal64(6)')":null} +{"v":"string","variantElement(v, 'Decimal64(6)')":null} +{"v":42.42,"variantElement(v, 'Decimal64(6)')":42.42} +{"v":"4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242","variantElement(v, 'Decimal64(6)')":null} +{"v":null,"variantElement(v, 'Decimal128(6)')":null} +{"v":"string","variantElement(v, 'Decimal128(6)')":null} +{"v":42.42,"variantElement(v, 'Decimal128(6)')":42.42} +{"v":"4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242","variantElement(v, 'Decimal128(6)')":null} +{"v":null,"variantElement(v, 'Decimal256(6)')":null} +{"v":"string","variantElement(v, 'Decimal256(6)')":null} +{"v":42.42,"variantElement(v, 'Decimal256(6)')":42.42} +{"v":"4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242","variantElement(v, 'Decimal256(6)')":null} +Dates and DateTimes +{"v":null,"variantElement(v, 'Date')":null} +{"v":"string","variantElement(v, 'Date')":null} +{"v":"2020-01-01","variantElement(v, 'Date')":"2020-01-01"} +{"v":"2020-01-01 00:00:00.999","variantElement(v, 'Date')":null} +{"v":null,"variantElement(v, 'Date32')":null} +{"v":"string","variantElement(v, 'Date32')":null} +{"v":"1900-01-01","variantElement(v, 'Date32')":"1900-01-01"} +{"v":"2020-01-01 00:00:00.999","variantElement(v, 'Date32')":null} +{"v":null,"variantElement(v, 'DateTime')":null} +{"v":"string","variantElement(v, 'DateTime')":null} +{"v":"2020-01-01 00:00:00","variantElement(v, 'DateTime')":"2020-01-01 00:00:00"} +{"v":"2020-01-01 00:00:00.999","variantElement(v, 'DateTime')":null} +{"v":null,"variantElement(v, 'DateTime64')":null} +{"v":"string","variantElement(v, 'DateTime64')":null} +{"v":"2020-01-01 00:00:00.999","variantElement(v, 'DateTime64')":"2020-01-01 00:00:00.999"} +{"v":"2020-01-01 00:00:00.999999999 ABC","variantElement(v, 'DateTime64')":null} +UUID +{"v":null,"variantElement(v, 'UUID')":null} +{"v":"string","variantElement(v, 'UUID')":null} +{"v":"c8619cca-0caa-445e-ae76-1d4f6e0b3927","variantElement(v, 'UUID')":"c8619cca-0caa-445e-ae76-1d4f6e0b3927"} +IPv4 +{"v":null,"variantElement(v, 'IPv4')":null} +{"v":"string","variantElement(v, 'IPv4')":null} +{"v":"127.0.0.1","variantElement(v, 'IPv4')":"127.0.0.1"} +IPv6 +{"v":null,"variantElement(v, 'IPv6')":null} +{"v":"string","variantElement(v, 'IPv6')":null} +{"v":"2001:db8:85a3::8a2e:370:7334","variantElement(v, 'IPv6')":"2001:db8:85a3::8a2e:370:7334"} +Enum +{"v":null,"variantElement(v, 'Enum(\\'a\\' = 1)')":null} +{"v":"string","variantElement(v, 'Enum(\\'a\\' = 1)')":null} +{"v":"a","variantElement(v, 'Enum(\\'a\\' = 1)')":"a"} +{"v":"a","variantElement(v, 'Enum(\\'a\\' = 1)')":"a"} +{"v":2,"variantElement(v, 'Enum(\\'a\\' = 1)')":null} +Map +{"v":null,"variantElement(v, 'Map(String, UInt64)')":{}} +{"v":"string","variantElement(v, 'Map(String, UInt64)')":{}} 
+{"v":{"a":"42","b":"43","c":"0"},"variantElement(v, 'Map(String, UInt64)')":{"a":"42","b":"43","c":"0"}} +{"v":"{\"c\" : 44, \"d\" : [1,2,3]}","variantElement(v, 'Map(String, UInt64)')":{}} +Tuple +{"v":null,"variantElement(v, 'Tuple(a UInt64, b UInt64)')":{"a":"0","b":"0"}} +{"v":"string","variantElement(v, 'Tuple(a UInt64, b UInt64)')":{"a":"0","b":"0"}} +{"v":{"a":"42","b":"0"},"variantElement(v, 'Tuple(a UInt64, b UInt64)')":{"a":"42","b":"0"}} +{"v":{"a":"44","b":"0"},"variantElement(v, 'Tuple(a UInt64, b UInt64)')":{"a":"44","b":"0"}} +\N (0,0) +string (0,0) +(42,0) (42,0) +{"a" : 44, "d" : 32} (0,0) +Array +{"v":null,"variantElement(v, 'Array(UInt64)')":[]} +{"v":"string","variantElement(v, 'Array(UInt64)')":[]} +{"v":["1","2","3"],"variantElement(v, 'Array(UInt64)')":["1","2","3"]} +{"v":["0","0","0"],"variantElement(v, 'Array(UInt64)')":["0","0","0"]} +{"v":"[1, 2, \"hello\"]","variantElement(v, 'Array(UInt64)')":[]} +LowCardinality +{"v":null,"variantElement(v, 'LowCardinality(String)')":null} +{"v":"string","variantElement(v, 'LowCardinality(String)')":"string"} +{"v":"42","variantElement(v, 'LowCardinality(String)')":null} +{"v":null,"variantElement(v, 'Array(LowCardinality(Nullable(String)))')":[]} +{"v":["string",null],"variantElement(v, 'Array(LowCardinality(Nullable(String)))')":["string",null]} +{"v":"42","variantElement(v, 'Array(LowCardinality(Nullable(String)))')":[]} +Nullable +{"v":null,"variantElement(v, 'Array(Nullable(String))')":[]} +{"v":"string","variantElement(v, 'Array(Nullable(String))')":[]} +{"v":["hello",null,"world"],"variantElement(v, 'Array(Nullable(String))')":["hello",null,"world"]} +{"repeat('-', 80)":"--------------------------------------------------------------------------------"} +CSV +String +\N,\N +"string","string" +"string","string" +42,\N +FixedString +\N,\N +"string",\N +"string",\N +"abcd","abcd" +Bool +\N,\N +"Truee",\N +true,true +Integers +\N,\N +"string",\N +-1,-1 +0,0 +10000000000,\N +"42d42",\N +\N,\N +"string",\N +-1,\N +0,0 +10000000000,\N +"42d42",\N +\N,\N +"string",\N +-1,-1 +0,0 +10000000000,\N +"42d42",\N +\N,\N +"string",\N +-1,\N +0,0 +10000000000,\N +"42d42",\N +\N,\N +"string",\N +-1,-1 +0,0 +10000000000,\N +"42d42",\N +\N,\N +"string",\N +-1,\N +0,0 +10000000000,\N +"42d42",\N +\N,\N +"string",\N +-1,-1 +0,0 +10000000000000000000000,\N +"42d42",\N +\N,\N +"string",\N +-1,\N +0,0 +10000000000000000000000,\N +"42d42",\N +\N,\N +"string",\N +-1,-1 +0,0 +"42d42",\N +\N,\N +"string",\N +-1,\N +0,0 +"42d42",\N +Floats +\N,\N +"string",\N +42.42,42.42 +"42.d42",\N +\N,\N +"string",\N +42.42,42.42 +"42.d42",\N +Decimals +\N,\N +"string",\N +42.42,42.42 +"42d42",\N +"4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242",\N +\N,\N +"string",\N +42.42,42.42 +"42d42",\N +"4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242",\N +\N,\N +"string",\N +42.42,42.42 +"42d42",\N +"4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242",\N +\N,\N +"string",\N +42.42,42.42 +"42d42",\N +"4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242",\N +Dates and DateTimes +\N,\N +"string",\N +"2020-01-d1",\N +"2020-01-01","2020-01-01" +"2020-01-01 00:00:00.999",\N +\N,\N +"string",\N +"2020-01-d1",\N +"1900-01-01","1900-01-01" +"2020-01-01 00:00:00.999",\N +\N,\N +"string",\N +"2020-01-d1",\N +"2020-01-01 
00:00:00","2020-01-01 00:00:00" +"2020-01-01 00:00:00.999",\N +\N,\N +"string",\N +"2020-01-d1",\N +"2020-01-01 00:00:00.999","2020-01-01 00:00:00.999" +"2020-01-01 00:00:00.999999999 ABC",\N +UUID +\N,\N +"string",\N +"c8619cca-0caa-445e-ae76-1d4f6e0b3927","c8619cca-0caa-445e-ae76-1d4f6e0b3927" +"c8619cca-0caa-445e-ae76-1d4f6e0b3927AAA",\N +IPv4 +\N,\N +"string",\N +"127.0.0.1","127.0.0.1" +"127.0.0.1AAA",\N +IPv6 +\N,\N +"string",\N +"2001:db8:85a3::8a2e:370:7334","2001:db8:85a3::8a2e:370:7334" +"2001:0db8:85a3:0000:0000:8a2e:0370:7334AAA",\N +Enum +\N,\N +"string",\N +"a","a" +"a","a" +2,\N +"aa",\N +Map +\N,"{}" +"string","{}" +"{'a':42,'b':43,'c':0}","{'a':42,'b':43,'c':0}" +"{'c' : 44, 'd' : [1,2,3]}","{}" +"{'c' : 44","{}" +Array +\N,"[]" +"string","[]" +"[1,2,3]","[1,2,3]" +"[0,0,0]","[0,0,0]" +"[1, 2, 'hello']","[]" +"[1, 2","[]" +LowCardinality +\N,\N +"string","string" +42,\N +\N,"[]" +"['string',NULL]","['string',NULL]" +"['string', nul]","[]" +42,"[]" +Nullable +\N,"[]" +"string","[]" +"['hello',NULL,'world']","['hello',NULL,'world']" +"['hello', nul]","[]" +{"repeat('-', 80)":"--------------------------------------------------------------------------------"} +TSV +String +\N \N +string string +42 \N +FixedString +\N \N +string \N +abcd abcd +Bool +\N \N +Truee \N +true true +Integers +\N \N +string \N +-1 -1 +0 0 +10000000000 \N +42d42 \N +\N \N +string \N +-1 \N +0 0 +10000000000 \N +42d42 \N +\N \N +string \N +-1 -1 +0 0 +10000000000 \N +42d42 \N +\N \N +string \N +-1 \N +0 0 +10000000000 \N +42d42 \N +\N \N +string \N +-1 -1 +0 0 +10000000000 \N +42d42 \N +\N \N +string \N +-1 \N +0 0 +10000000000 \N +42d42 \N +\N \N +string \N +-1 -1 +0 0 +10000000000000000000000 \N +42d42 \N +\N \N +string \N +-1 \N +0 0 +10000000000000000000000 \N +42d42 \N +\N \N +string \N +-1 -1 +0 0 +42d42 \N +\N \N +string \N +-1 \N +0 0 +42d42 \N +Floats +\N \N +string \N +42.42 42.42 +42.d42 \N +\N \N +string \N +42.42 42.42 +42.d42 \N +Decimals +\N \N +string \N +42.42 42.42 +42d42 \N +4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242 \N +\N \N +string \N +42.42 42.42 +42d42 \N +4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242 \N +\N \N +string \N +42.42 42.42 +42d42 \N +4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242 \N +\N \N +string \N +42.42 42.42 +42d42 \N +4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242 \N +Dates and DateTimes +\N \N +string \N +2020-01-d1 \N +2020-01-01 2020-01-01 +2020-01-01 00:00:00.999 \N +\N \N +string \N +2020-01-d1 \N +1900-01-01 1900-01-01 +2020-01-01 00:00:00.999 \N +\N \N +string \N +2020-01-d1 \N +2020-01-01 00:00:00 2020-01-01 00:00:00 +2020-01-01 00:00:00.999 \N +\N \N +string \N +2020-01-d1 \N +2020-01-01 00:00:00.999 2020-01-01 00:00:00.999 +2020-01-01 00:00:00.999999999 ABC \N +UUID +\N \N +string \N +c8619cca-0caa-445e-ae76-1d4f6e0b3927 c8619cca-0caa-445e-ae76-1d4f6e0b3927 +c8619cca-0caa-445e-ae76-1d4f6e0b3927AAA \N +IPv4 +\N \N +string \N +127.0.0.1 127.0.0.1 +127.0.0.1AAA \N +IPv6 +\N \N +string \N +2001:db8:85a3::8a2e:370:7334 2001:db8:85a3::8a2e:370:7334 +2001:0db8:85a3:0000:0000:8a2e:0370:7334AAA \N +Enum +\N \N +string \N +a a +a a +2 \N +aa \N +Map +\N {} +string {} +{'a':42,'b':43,'c':0} {'a':42,'b':43,'c':0} +{\'c\' : 44, \'d\' : [1,2,3]} {} +{\'c\' : 44 {} +Array +\N [] +string [] +[1,2,3] 
[1,2,3] +[0,0,0] [0,0,0] +[1, 2, \'hello\'] [] +[1, 2 [] +LowCardinality +\N \N +string string +42 \N +\N [] +['string',NULL] ['string',NULL] +[\'string\', nul] [] +42 [] +Nullable +\N [] +string [] +['hello',NULL,'world'] ['hello',NULL,'world'] +[\'hello\', nul] [] +{"repeat('-', 80)":"--------------------------------------------------------------------------------"} +Values +String +(NULL,NULL),('string','string'),(42,NULL)FixedString +(NULL,NULL),('string',NULL),('abcd','abcd')Bool +(NULL,NULL),(true,true)Integers +(NULL,NULL),('string',NULL),(-1,-1),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,NULL),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,-1),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,NULL),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,-1),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,NULL),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,-1),(0,0),(10000000000000000000000,NULL)(NULL,NULL),('string',NULL),(-1,NULL),(0,0),(10000000000000000000000,NULL)(NULL,NULL),('string',NULL),(-1,-1),(0,0)(NULL,NULL),('string',NULL),(-1,NULL),(0,0)Floats +(NULL,NULL),('string',NULL),(42.42,42.42)(NULL,NULL),('string',NULL),(42.42,42.42)Decimals +(NULL,NULL),('string',NULL),(42.42,42.42)(NULL,NULL),('string',NULL),(42.42,42.42)(NULL,NULL),('string',NULL),(42.42,42.42)(NULL,NULL),('string',NULL),(42.42,42.42)Dates and DateTimes +(NULL,NULL),('string',NULL),('1970-01-01 00:00:00.000',NULL),('2020-01-01','2020-01-01'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('1970-01-01 00:00:00.000',NULL),('1900-01-01','1900-01-01'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('1970-01-01 00:00:00.000',NULL),('2020-01-01 00:00:00','2020-01-01 00:00:00'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('1970-01-01 00:00:00.000','1970-01-01 00:00:00.000'),('2020-01-01 00:00:00.999',NULL),('2020-01-01 00:00:00.999999999 ABC',NULL)UUID +(NULL,NULL),('string',NULL),('c8619cca-0caa-445e-ae76-1d4f6e0b3927','c8619cca-0caa-445e-ae76-1d4f6e0b3927'),('c8619cca-0caa-445e-ae76-1d4f6e0b3927AAA',NULL)IPv4 +(NULL,NULL),('string',NULL),('127.0.0.1','127.0.0.1'),('127.0.0.1AAA',NULL)IPv6 +(NULL,NULL),('string',NULL),('2001:db8:85a3::8a2e:370:7334','2001:db8:85a3::8a2e:370:7334'),('2001:0db8:85a3:0000:0000:8a2e:0370:7334AAA',NULL)Enum +(NULL,NULL),('string',NULL),('a','a'),(1,NULL),(2,NULL),('aa',NULL)Map +(NULL,{}),('string',{}),({'a':42,'b':43,'c':0},{'a':42,'b':43,'c':0})Array +(NULL,[]),('string',[]),([1,2,3],[1,2,3]),([0,0,0],[0,0,0])LowCardinality +(NULL,NULL),('string','string'),(42,NULL)(NULL,[]),(['string',NULL],['string',NULL]),(42,[])Nullable +(NULL,[]),('string',[]),(['hello',NULL,'world'],['hello',NULL,'world']) diff --git a/tests/queries/0_stateless/02940_variant_text_deserialization.sql b/tests/queries/0_stateless/02940_variant_text_deserialization.sql new file mode 100644 index 00000000000..041d02088ef --- /dev/null +++ b/tests/queries/0_stateless/02940_variant_text_deserialization.sql @@ -0,0 +1,266 @@ +set allow_experimental_variant_type = 1; +set session_timezone = 'UTC'; + +select 'JSON'; +select 'String'; +select v, variantElement(v, 'String') from format(JSONEachRow, 'v Variant(String, UInt64)', '{"v" : null}, {"v" : "string"}, {"v" : 42}') format JSONEachRow; + +select 'FixedString'; +select v, variantElement(v, 'FixedString(4)') from format(JSONEachRow, 'v Variant(String, FixedString(4))', '{"v" : null}, {"v" : "string"}, {"v" : "abcd"}') format JSONEachRow; + +select 'Bool'; +select v, 
variantElement(v, 'Bool') from format(JSONEachRow, 'v Variant(String, Bool)', '{"v" : null}, {"v" : "string"}, {"v" : true}') format JSONEachRow; + +select 'Integers'; +select v, variantElement(v, 'Int8') from format(JSONEachRow, 'v Variant(String, Int8, UInt64)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}, {"v" : 10000000000}') format JSONEachRow; +select v, variantElement(v, 'UInt8') from format(JSONEachRow, 'v Variant(String, UInt8, Int64)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}, {"v" : 10000000000}') format JSONEachRow; +select v, variantElement(v, 'Int16') from format(JSONEachRow, 'v Variant(String, Int16, Int64)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}, {"v" : 10000000000}') format JSONEachRow; +select v, variantElement(v, 'UInt16') from format(JSONEachRow, 'v Variant(String, UInt16, Int64)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}, {"v" : 10000000000}') format JSONEachRow; +select v, variantElement(v, 'Int32') from format(JSONEachRow, 'v Variant(String, Int32, Int64)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}, {"v" : 10000000000}') format JSONEachRow; +select v, variantElement(v, 'UInt32') from format(JSONEachRow, 'v Variant(String, UInt32, Int64)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}, {"v" : 10000000000}') format JSONEachRow; +select v, variantElement(v, 'Int64') from format(JSONEachRow, 'v Variant(String, Int64, Int128)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}, {"v" : 10000000000000000000000}') format JSONEachRow; +select v, variantElement(v, 'UInt64') from format(JSONEachRow, 'v Variant(String, UInt64, Int128)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}, {"v" : 10000000000000000000000}') format JSONEachRow; +select v, variantElement(v, 'Int128') from format(JSONEachRow, 'v Variant(String, Int128, Int256)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}') format JSONEachRow; +select v, variantElement(v, 'UInt128') from format(JSONEachRow, 'v Variant(String, UInt128, Int256)', '{"v" : null}, {"v" : "string"}, {"v" : -1}, {"v" : 0}') format JSONEachRow; + +select 'Floats'; +select v, variantElement(v, 'Float32') from format(JSONEachRow, 'v Variant(String, Float32)', '{"v" : null}, {"v" : "string"}, {"v" : 42.42}') format JSONEachRow; +select v, variantElement(v, 'Float64') from format(JSONEachRow, 'v Variant(String, Float64)', '{"v" : null}, {"v" : "string"}, {"v" : 42.42}') format JSONEachRow; + +select 'Decimals'; +select v, variantElement(v, 'Decimal32(6)') from format(JSONEachRow, 'v Variant(String, Decimal32(6))', '{"v" : null}, {"v" : "string"}, {"v" : 42.42}, {"v" : 4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242}') format JSONEachRow; +select v, variantElement(v, 'Decimal64(6)') from format(JSONEachRow, 'v Variant(String, Decimal64(6))', '{"v" : null}, {"v" : "string"}, {"v" : 42.42}, {"v" : 4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242}') format JSONEachRow; +select v, variantElement(v, 'Decimal128(6)') from format(JSONEachRow, 'v Variant(String, Decimal128(6))', '{"v" : null}, {"v" : "string"}, {"v" : 42.42}, {"v" : 4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242}') format JSONEachRow; +select v, variantElement(v, 'Decimal256(6)') from format(JSONEachRow, 'v Variant(String, Decimal256(6))', '{"v" : null}, {"v" : "string"}, {"v" : 42.42}, {"v" : 
4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242}') format JSONEachRow; + +select 'Dates and DateTimes'; +select v, variantElement(v, 'Date') from format(JSONEachRow, 'v Variant(String, Date, DateTime64)', '{"v" : null}, {"v" : "string"}, {"v" : "2020-01-01"}, {"v" : "2020-01-01 00:00:00.999"}') format JSONEachRow; +select v, variantElement(v, 'Date32') from format(JSONEachRow, 'v Variant(String, Date32, DateTime64)', '{"v" : null}, {"v" : "string"}, {"v" : "1900-01-01"}, {"v" : "2020-01-01 00:00:00.999"}') format JSONEachRow; +select v, variantElement(v, 'DateTime') from format(JSONEachRow, 'v Variant(String, DateTime, DateTime64)', '{"v" : null}, {"v" : "string"}, {"v" : "2020-01-01 00:00:00"}, {"v" : "2020-01-01 00:00:00.999"}') format JSONEachRow; +select v, variantElement(v, 'DateTime64') from format(JSONEachRow, 'v Variant(String, DateTime64)', '{"v" : null}, {"v" : "string"}, {"v" : "2020-01-01 00:00:00.999"}, {"v" : "2020-01-01 00:00:00.999999999 ABC"}') format JSONEachRow; + +select 'UUID'; +select v, variantElement(v, 'UUID') from format(JSONEachRow, 'v Variant(String, UUID)', '{"v" : null}, {"v" : "string"}, {"v" : "c8619cca-0caa-445e-ae76-1d4f6e0b3927"}') format JSONEachRow; + +select 'IPv4'; +select v, variantElement(v, 'IPv4') from format(JSONEachRow, 'v Variant(String, IPv4)', '{"v" : null}, {"v" : "string"}, {"v" : "127.0.0.1"}') format JSONEachRow; + +select 'IPv6'; +select v, variantElement(v, 'IPv6') from format(JSONEachRow, 'v Variant(String, IPv6)', '{"v" : null}, {"v" : "string"}, {"v" : "2001:0db8:85a3:0000:0000:8a2e:0370:7334"}') format JSONEachRow; + +select 'Enum'; +select v, variantElement(v, 'Enum(''a'' = 1)') from format(JSONEachRow, 'v Variant(String, UInt32, Enum(''a'' = 1))', '{"v" : null}, {"v" : "string"}, {"v" : "a"}, {"v" : 1}, {"v" : 2}') format JSONEachRow; + +select 'Map'; +select v, variantElement(v, 'Map(String, UInt64)') from format(JSONEachRow, 'v Variant(String, Map(String, UInt64))', '{"v" : null}, {"v" : "string"}, {"v" : {"a" : 42, "b" : 43, "c" : null}}, {"v" : {"c" : 44, "d" : [1,2,3]}}') format JSONEachRow; + +select 'Tuple'; +select v, variantElement(v, 'Tuple(a UInt64, b UInt64)') from format(JSONEachRow, 'v Variant(String, Tuple(a UInt64, b UInt64))', '{"v" : null}, {"v" : "string"}, {"v" : {"a" : 42, "b" : null}}, {"v" : {"a" : 44, "d" : 32}}') format JSONEachRow; +select v, variantElement(v, 'Tuple(a UInt64, b UInt64)') from format(JSONEachRow, 'v Variant(String, Tuple(a UInt64, b UInt64))', '{"v" : null}, {"v" : "string"}, {"v" : {"a" : 42, "b" : null}}, {"v" : {"a" : 44, "d" : 32}}') settings input_format_json_defaults_for_missing_elements_in_named_tuple=0; + +select 'Array'; +select v, variantElement(v, 'Array(UInt64)') from format(JSONEachRow, 'v Variant(String, Array(UInt64))', '{"v" : null}, {"v" : "string"}, {"v" : [1, 2, 3]}, {"v" : [null, null, null]} {"v" : [1, 2, "hello"]}') format JSONEachRow; + +select 'LowCardinality'; +select v, variantElement(v, 'LowCardinality(String)') from format(JSONEachRow, 'v Variant(LowCardinality(String), UInt64)', '{"v" : null}, {"v" : "string"}, {"v" : 42}') format JSONEachRow; +select v, variantElement(v, 'Array(LowCardinality(Nullable(String)))') from format(JSONEachRow, 'v Variant(Array(LowCardinality(Nullable(String))), UInt64)', '{"v" : null}, {"v" : ["string", null]}, {"v" : 42}') format JSONEachRow; + +select 'Nullable'; +select v, variantElement(v, 'Array(Nullable(String))') from format(JSONEachRow, 'v Variant(String, 
Array(Nullable(String)))', '{"v" : null}, {"v" : "string"}, {"v" : ["hello", null, "world"]}') format JSONEachRow; + +select repeat('-', 80) format JSONEachRow; + +select 'CSV'; +select 'String'; +select v, variantElement(v, 'String') from format(CSV, 'v Variant(String, UInt64)', '\\N\n"string"\nstring\n42') format CSV; + +select 'FixedString'; +select v, variantElement(v, 'FixedString(4)') from format(CSV, 'v Variant(String, FixedString(4))', '\\N\n"string"\nstring\n"abcd"') format CSV; + +select 'Bool'; +select v, variantElement(v, 'Bool') from format(CSV, 'v Variant(String, Bool)', '\\N\nTruee\nTrue') format CSV; + +select 'Integers'; +select v, variantElement(v, 'Int8') from format(CSV, 'v Variant(String, Int8, UInt64)', '\n"string"\n-1\n0\n10000000000\n42d42') format CSV; +select v, variantElement(v, 'UInt8') from format(CSV, 'v Variant(String, UInt8, Int64)', '\\N\n"string"\n-1\n0\n10000000000\n42d42') format CSV; +select v, variantElement(v, 'Int16') from format(CSV, 'v Variant(String, Int16, Int64)', '\\N\n"string"\n-1\n0\n10000000000\n42d42') format CSV; +select v, variantElement(v, 'UInt16') from format(CSV, 'v Variant(String, UInt16, Int64)', '\\N\n"string"\n-1\n0\n10000000000\n42d42') format CSV; +select v, variantElement(v, 'Int32') from format(CSV, 'v Variant(String, Int32, Int64)', '\\N\n"string"\n-1\n0\n10000000000\n42d42') format CSV; +select v, variantElement(v, 'UInt32') from format(CSV, 'v Variant(String, UInt32, Int64)', '\\N\n"string"\n-1\n0\n10000000000\n42d42') format CSV; +select v, variantElement(v, 'Int64') from format(CSV, 'v Variant(String, Int64, Int128)', '\\N\n"string"\n-1\n0\n10000000000000000000000\n42d42') format CSV; +select v, variantElement(v, 'UInt64') from format(CSV, 'v Variant(String, UInt64, Int128)', '\\N\n"string"\n-1\n0\n10000000000000000000000\n42d42') format CSV; +select v, variantElement(v, 'Int128') from format(CSV, 'v Variant(String, Int128, Int256)', '\\N\n"string"\n-1\n0\n42d42') format CSV; +select v, variantElement(v, 'UInt128') from format(CSV, 'v Variant(String, UInt128, Int256)', '\\N\n"string"\n-1\n0\n42d42') format CSV; + +select 'Floats'; +select v, variantElement(v, 'Float32') from format(CSV, 'v Variant(String, Float32)', '\\N\n"string"\n42.42\n42.d42') format CSV; +select v, variantElement(v, 'Float64') from format(CSV, 'v Variant(String, Float64)', '\\N\n"string"\n42.42\n42.d42') format CSV; + +select 'Decimals'; +select v, variantElement(v, 'Decimal32(6)') from format(CSV, 'v Variant(String, Decimal32(6))', '\\N\n"string"\n42.42\n42d42\n4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242') format CSV; +select v, variantElement(v, 'Decimal64(6)') from format(CSV, 'v Variant(String, Decimal64(6))', '\\N\n"string"\n42.42\n42d42\n4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242') format CSV; +select v, variantElement(v, 'Decimal128(6)') from format(CSV, 'v Variant(String, Decimal128(6))', '\\N\n"string"\n42.42\n42d42\n4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242') format CSV; +select v, variantElement(v, 'Decimal256(6)') from format(CSV, 'v Variant(String, Decimal256(6))', '\\N\n"string"\n42.42\n42d42\n4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242') format CSV; + +select 'Dates and DateTimes'; +select v, variantElement(v, 'Date') from format(CSV, 'v Variant(String, 
Date, DateTime64)', '\\N\n"string"\n"2020-01-d1"\n"2020-01-01"\n"2020-01-01 00:00:00.999"') format CSV; +select v, variantElement(v, 'Date32') from format(CSV, 'v Variant(String, Date32, DateTime64)', '\\N\n"string"\n"2020-01-d1"\n"1900-01-01"\n"2020-01-01 00:00:00.999"') format CSV; +select v, variantElement(v, 'DateTime') from format(CSV, 'v Variant(String, DateTime, DateTime64)', '\\N\n"string"\n"2020-01-d1"\n"2020-01-01 00:00:00"\n"2020-01-01 00:00:00.999"') format CSV; +select v, variantElement(v, 'DateTime64') from format(CSV, 'v Variant(String, DateTime64)', '\\N\n"string"\n"2020-01-d1"\n"2020-01-01 00:00:00.999"\n"2020-01-01 00:00:00.999999999 ABC"') format CSV; + +select 'UUID'; +select v, variantElement(v, 'UUID') from format(CSV, 'v Variant(String, UUID)', '\\N\n"string"\n"c8619cca-0caa-445e-ae76-1d4f6e0b3927"\nc8619cca-0caa-445e-ae76-1d4f6e0b3927AAA') format CSV; + +select 'IPv4'; +select v, variantElement(v, 'IPv4') from format(CSV, 'v Variant(String, IPv4)', '\\N\n"string"\n"127.0.0.1"\n"127.0.0.1AAA"') format CSV; + +select 'IPv6'; +select v, variantElement(v, 'IPv6') from format(CSV, 'v Variant(String, IPv6)', '\\N\n"string"\n"2001:0db8:85a3:0000:0000:8a2e:0370:7334"\n2001:0db8:85a3:0000:0000:8a2e:0370:7334AAA') format CSV; + +select 'Enum'; +select v, variantElement(v, 'Enum(''a'' = 1)') from format(CSV, 'v Variant(String, UInt32, Enum(''a'' = 1))', '\\N\n"string"\n"a"\n1\n2\naa') format CSV; + +select 'Map'; +select v, variantElement(v, 'Map(String, UInt64)') from format(CSV, 'v Variant(String, Map(String, UInt64))', '\\N\n"string"\n"{''a'' : 42, ''b'' : 43, ''c'' : null}"\n"{''c'' : 44, ''d'' : [1,2,3]}"\n"{''c'' : 44"') format CSV; + +select 'Array'; +select v, variantElement(v, 'Array(UInt64)') from format(CSV, 'v Variant(String, Array(UInt64))', '\\N\n"string"\n"[1, 2, 3]"\n"[null, null, null]"\n"[1, 2, ''hello'']"\n"[1, 2"') format CSV; + +select 'LowCardinality'; +select v, variantElement(v, 'LowCardinality(String)') from format(CSV, 'v Variant(LowCardinality(String), UInt64)', '\\N\n"string"\n42') format CSV; +select v, variantElement(v, 'Array(LowCardinality(Nullable(String)))') from format(CSV, 'v Variant(Array(LowCardinality(Nullable(String))), UInt64, String)', '\\N\n"[''string'', null]"\n"[''string'', nul]"\n42') format CSV; + +select 'Nullable'; +select v, variantElement(v, 'Array(Nullable(String))') from format(CSV, 'v Variant(String, Array(Nullable(String)))', '\\N\n"string"\n"[''hello'', null, ''world'']"\n"[''hello'', nul]"') format CSV; + +select repeat('-', 80) format JSONEachRow; + +select 'TSV'; +select 'String'; +select v, variantElement(v, 'String') from format(TSV, 'v Variant(String, UInt64)', '\\N\nstring\n42') format TSV; + +select 'FixedString'; +select v, variantElement(v, 'FixedString(4)') from format(TSV, 'v Variant(String, FixedString(4))', '\\N\nstring\nabcd') format TSV; + +select 'Bool'; +select v, variantElement(v, 'Bool') from format(TSV, 'v Variant(String, Bool)', '\\N\nTruee\nTrue') format TSV; + +select 'Integers'; +select v, variantElement(v, 'Int8') from format(TSV, 'v Variant(String, Int8, UInt64)', '\\N\nstring\n-1\n0\n10000000000\n42d42') format TSV; +select v, variantElement(v, 'UInt8') from format(TSV, 'v Variant(String, UInt8, Int64)', '\\N\nstring\n-1\n0\n10000000000\n42d42') format TSV; +select v, variantElement(v, 'Int16') from format(TSV, 'v Variant(String, Int16, Int64)', '\\N\nstring\n-1\n0\n10000000000\n42d42') format TSV; +select v, variantElement(v, 'UInt16') from format(TSV, 'v Variant(String, UInt16, Int64)', 
'\\N\nstring\n-1\n0\n10000000000\n42d42') format TSV; +select v, variantElement(v, 'Int32') from format(TSV, 'v Variant(String, Int32, Int64)', '\\N\nstring\n-1\n0\n10000000000\n42d42') format TSV; +select v, variantElement(v, 'UInt32') from format(TSV, 'v Variant(String, UInt32, Int64)', '\\N\nstring\n-1\n0\n10000000000\n42d42') format TSV; +select v, variantElement(v, 'Int64') from format(TSV, 'v Variant(String, Int64, Int128)', '\\N\nstring\n-1\n0\n10000000000000000000000\n42d42') format TSV; +select v, variantElement(v, 'UInt64') from format(TSV, 'v Variant(String, UInt64, Int128)', '\\N\nstring\n-1\n0\n10000000000000000000000\n42d42') format TSV; +select v, variantElement(v, 'Int128') from format(TSV, 'v Variant(String, Int128, Int256)', '\\N\nstring\n-1\n0\n42d42') format TSV; +select v, variantElement(v, 'UInt128') from format(TSV, 'v Variant(String, UInt128, Int256)', '\\N\nstring\n-1\n0\n42d42') format TSV; + +select 'Floats'; +select v, variantElement(v, 'Float32') from format(TSV, 'v Variant(String, Float32)', '\\N\nstring\n42.42\n42.d42') format TSV; +select v, variantElement(v, 'Float64') from format(TSV, 'v Variant(String, Float64)', '\\N\nstring\n42.42\n42.d42') format TSV; + +select 'Decimals'; +select v, variantElement(v, 'Decimal32(6)') from format(TSV, 'v Variant(String, Decimal32(6))', '\\N\nstring\n42.42\n42d42\n4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242') format TSV; +select v, variantElement(v, 'Decimal64(6)') from format(TSV, 'v Variant(String, Decimal64(6))', '\\N\nstring\n42.42\n42d42\n4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242') format TSV; +select v, variantElement(v, 'Decimal128(6)') from format(TSV, 'v Variant(String, Decimal128(6))', '\\N\nstring\n42.42\n42d42\n4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242') format TSV; +select v, variantElement(v, 'Decimal256(6)') from format(TSV, 'v Variant(String, Decimal256(6))', '\\N\nstring\n42.42\n42d42\n4242424242424242424242424242424242424242424242424242424242424242424242424242424242424242424242.424242424242424242') format TSV; + +select 'Dates and DateTimes'; +select v, variantElement(v, 'Date') from format(TSV, 'v Variant(String, Date, DateTime64)', '\\N\nstring\n2020-01-d1\n2020-01-01\n2020-01-01 00:00:00.999') format TSV; +select v, variantElement(v, 'Date32') from format(TSV, 'v Variant(String, Date32, DateTime64)', '\\N\nstring\n2020-01-d1\n1900-01-01\n2020-01-01 00:00:00.999') format TSV; +select v, variantElement(v, 'DateTime') from format(TSV, 'v Variant(String, DateTime, DateTime64)', '\\N\nstring\n2020-01-d1\n2020-01-01 00:00:00\n2020-01-01 00:00:00.999') format TSV; +select v, variantElement(v, 'DateTime64') from format(TSV, 'v Variant(String, DateTime64)', '\\N\nstring\n2020-01-d1\n2020-01-01 00:00:00.999\n2020-01-01 00:00:00.999999999 ABC') format TSV; + +select 'UUID'; +select v, variantElement(v, 'UUID') from format(TSV, 'v Variant(String, UUID)', '\\N\nstring\nc8619cca-0caa-445e-ae76-1d4f6e0b3927\nc8619cca-0caa-445e-ae76-1d4f6e0b3927AAA') format TSV; + +select 'IPv4'; +select v, variantElement(v, 'IPv4') from format(TSV, 'v Variant(String, IPv4)', '\\N\nstring\n127.0.0.1\n127.0.0.1AAA') format TSV; + +select 'IPv6'; +select v, variantElement(v, 'IPv6') from format(TSV, 'v Variant(String, IPv6)', '\\N\nstring\n2001:0db8:85a3:0000:0000:8a2e:0370:7334\n2001:0db8:85a3:0000:0000:8a2e:0370:7334AAA') 
format TSV; + +select 'Enum'; +select v, variantElement(v, 'Enum(''a'' = 1)') from format(TSV, 'v Variant(String, UInt32, Enum(''a'' = 1))', '\\N\nstring\na\n1\n2\naa') format TSV; + +select 'Map'; +select v, variantElement(v, 'Map(String, UInt64)') from format(TSV, 'v Variant(String, Map(String, UInt64))', '\\N\nstring\n{''a'' : 42, ''b'' : 43, ''c'' : null}\n{''c'' : 44, ''d'' : [1,2,3]}\n{''c'' : 44') format TSV; + +select 'Array'; +select v, variantElement(v, 'Array(UInt64)') from format(TSV, 'v Variant(String, Array(UInt64))', '\\N\nstring\n[1, 2, 3]\n[null, null, null]\n[1, 2, ''hello'']\n[1, 2') format TSV; + +select 'LowCardinality'; +select v, variantElement(v, 'LowCardinality(String)') from format(TSV, 'v Variant(LowCardinality(String), UInt64)', '\\N\nstring\n42') format TSV; +select v, variantElement(v, 'Array(LowCardinality(Nullable(String)))') from format(TSV, 'v Variant(Array(LowCardinality(Nullable(String))), UInt64, String)', '\\N\n[''string'', null]\n[''string'', nul]\n42') format TSV; + +select 'Nullable'; +select v, variantElement(v, 'Array(Nullable(String))') from format(TSV, 'v Variant(String, Array(Nullable(String)))', '\\N\nstring\n[''hello'', null, ''world'']\n[''hello'', nul]') format TSV; + +select repeat('-', 80) format JSONEachRow; + +select 'Values'; +select 'String'; +select v, variantElement(v, 'String') from format(Values, 'v Variant(String, UInt64)', '(NULL), (''string''), (42)') format Values; + +select 'FixedString'; +select v, variantElement(v, 'FixedString(4)') from format(Values, 'v Variant(String, FixedString(4))', '(NULL), (''string''), (''abcd'')') format Values; + +select 'Bool'; +select v, variantElement(v, 'Bool') from format(Values, 'v Variant(String, Bool)', '(NULL), (True)') format Values; + +select 'Integers'; +select v, variantElement(v, 'Int8') from format(Values, 'v Variant(String, Int8, UInt64)', '(NULL), (''string''), (-1), (0), (10000000000)') format Values; +select v, variantElement(v, 'UInt8') from format(Values, 'v Variant(String, UInt8, Int64)', '(NULL), (''string''), (-1), (0), (10000000000)') format Values; +select v, variantElement(v, 'Int16') from format(Values, 'v Variant(String, Int16, Int64)', '(NULL), (''string''), (-1), (0), (10000000000)') format Values; +select v, variantElement(v, 'UInt16') from format(Values, 'v Variant(String, UInt16, Int64)', '(NULL), (''string''), (-1), (0), (10000000000)') format Values; +select v, variantElement(v, 'Int32') from format(Values, 'v Variant(String, Int32, Int64)', '(NULL), (''string''), (-1), (0), (10000000000)') format Values; +select v, variantElement(v, 'UInt32') from format(Values, 'v Variant(String, UInt32, Int64)', '(NULL), (''string''), (-1), (0), (10000000000)') format Values; +select v, variantElement(v, 'Int64') from format(Values, 'v Variant(String, Int64, Int128)', '(NULL), (''string''), (-1), (0), (10000000000000000000000)') format Values; +select v, variantElement(v, 'UInt64') from format(Values, 'v Variant(String, UInt64, Int128)', '(NULL), (''string''), (-1), (0), (10000000000000000000000)') format Values; +select v, variantElement(v, 'Int128') from format(Values, 'v Variant(String, Int128, Int256)', '(NULL), (''string''), (-1), (0)') format Values; +select v, variantElement(v, 'UInt128') from format(Values, 'v Variant(String, UInt128, Int256)', '(NULL), (''string''), (-1), (0)') format Values; + +select 'Floats'; +select v, variantElement(v, 'Float32') from format(Values, 'v Variant(String, Float32)', '(NULL), (''string''), (42.42)') format Values; +select v, 
variantElement(v, 'Float64') from format(Values, 'v Variant(String, Float64)', '(NULL), (''string''), (42.42)') format Values; + +select 'Decimals'; +select v, variantElement(v, 'Decimal32(6)') from format(Values, 'v Variant(String, Decimal32(6))', '(NULL), (''string''), (42.42)') format Values; +select v, variantElement(v, 'Decimal64(6)') from format(Values, 'v Variant(String, Decimal64(6))', '(NULL), (''string''), (42.42)') format Values; +select v, variantElement(v, 'Decimal128(6)') from format(Values, 'v Variant(String, Decimal128(6))', '(NULL), (''string''), (42.42)') format Values; +select v, variantElement(v, 'Decimal256(6)') from format(Values, 'v Variant(String, Decimal256(6))', '(NULL), (''string''), (42.42)') format Values; + +select 'Dates and DateTimes'; +select v, variantElement(v, 'Date') from format(Values, 'v Variant(String, Date, DateTime64)', '(NULL), (''string''), (''2020-01-d1''), (''2020-01-01''), (''2020-01-01 00:00:00.999'')') format Values; +select v, variantElement(v, 'Date32') from format(Values, 'v Variant(String, Date32, DateTime64)', '(NULL), (''string''), (''2020-01-d1''), (''1900-01-01''), (''2020-01-01 00:00:00.999'')') format Values; +select v, variantElement(v, 'DateTime') from format(Values, 'v Variant(String, DateTime, DateTime64)', '(NULL), (''string''), (''2020-01-d1''), (''2020-01-01 00:00:00''), (''2020-01-01 00:00:00.999'')') format Values; +select v, variantElement(v, 'DateTime64') from format(Values, 'v Variant(String, DateTime64)', '(NULL), (''string''), (''2020-01-d1''), (''2020-01-01 00:00:00.999''), (''2020-01-01 00:00:00.999999999 ABC'')') format Values; + +select 'UUID'; +select v, variantElement(v, 'UUID') from format(Values, 'v Variant(String, UUID)', '(NULL), (''string''), (''c8619cca-0caa-445e-ae76-1d4f6e0b3927''), (''c8619cca-0caa-445e-ae76-1d4f6e0b3927AAA'')') format Values; + +select 'IPv4'; +select v, variantElement(v, 'IPv4') from format(Values, 'v Variant(String, IPv4)', '(NULL), (''string''), (''127.0.0.1''), (''127.0.0.1AAA'')') format Values; + +select 'IPv6'; +select v, variantElement(v, 'IPv6') from format(Values, 'v Variant(String, IPv6)', '(NULL), (''string''), (''2001:0db8:85a3:0000:0000:8a2e:0370:7334''), (''2001:0db8:85a3:0000:0000:8a2e:0370:7334AAA'')') format Values; + +select 'Enum'; +select v, variantElement(v, 'Enum(''a'' = 1)') from format(Values, 'v Variant(String, UInt32, Enum(''a'' = 1))', '(NULL), (''string''), (''a''), (1), (2), (''aa'')') format Values; + +select 'Map'; +select v, variantElement(v, 'Map(String, UInt64)') from format(Values, 'v Variant(String, Map(String, UInt64))', '(NULL), (''string''), ({''a'' : 42, ''b'' : 43, ''c'' : null})') format Values; + +select 'Array'; +select v, variantElement(v, 'Array(UInt64)') from format(Values, 'v Variant(String, Array(UInt64))', '(NULL), (''string''), ([1, 2, 3]), ([null, null, null])') format Values; + +select 'LowCardinality'; +select v, variantElement(v, 'LowCardinality(String)') from format(Values, 'v Variant(LowCardinality(String), UInt64)', '(NULL), (''string''), (42)') format Values; +select v, variantElement(v, 'Array(LowCardinality(Nullable(String)))') from format(Values, 'v Variant(Array(LowCardinality(Nullable(String))), UInt64, String)', '(NULL), ([''string'', null]), (42)') format Values; + +select 'Nullable'; +select v, variantElement(v, 'Array(Nullable(String))') from format(Values, 'v Variant(String, Array(Nullable(String)))', '(NULL), (''string''), ([''hello'', null, ''world''])') format Values; + +select ''; \ No newline at end of file diff 
--git a/tests/queries/0_stateless/02941_variant_type_1.reference b/tests/queries/0_stateless/02941_variant_type_1.reference new file mode 100644 index 00000000000..8a6e77d4f6d --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_1.reference @@ -0,0 +1,2472 @@ +Memory +test1 insert +test1 select +\N +\N +\N +0 +1 +2 +str_0 +str_1 +str_2 +lc_str_0 +lc_str_1 +lc_str_2 +(0,1) +(1,2) +(2,3) +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +str_1 +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +lc_str_1 +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(1,2) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +----------------------------------------------------------------------------------------------------------- +test2 insert +test2 select +\N +\N +\N +0 +\N +2 +str_0 +\N +str_2 +lc_str_0 +\N +lc_str_2 +(0,1) +\N +(2,3) +[0] +\N +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +\N +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +\N +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(0,0) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +----------------------------------------------------------------------------------------------------------- +test3 insert +test3 select +\N +str_1 +2 +lc_str_3 +(4,5) +[0,1,2,3,4,5] +\N +str_7 +8 +lc_str_9 +(10,11) +[0,1,2,3,4,5,6,7,8,9,10,11] +\N +str_13 +14 +lc_str_15 +(16,17) +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +str_1 +\N +\N +\N +\N +\N +str_7 +\N +\N +\N +\N +\N +str_13 +\N +\N +\N +\N +\N +\N +2 +\N +\N +\N +\N +\N +8 +\N +\N +\N +\N +\N +14 +\N +\N +\N +\N +\N +\N +lc_str_3 +\N +\N +\N +\N +\N +lc_str_9 +\N +\N +\N +\N +\N +lc_str_15 +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(4,5) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(10,11) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(16,17) +(0,0) +\N +\N +\N +\N +4 +\N +\N +\N +\N +\N +10 +\N +\N +\N +\N +\N +16 +\N +\N +\N +\N +\N +5 +\N +\N +\N +\N +\N +11 +\N +\N +\N +\N +\N +17 +\N +[] +[] +[] +[] +[] +[0,1,2,3,4,5] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +\N +\N +\N +\N +6 +\N +\N +\N +\N +\N +12 +\N +\N +\N +\N +\N +18 +----------------------------------------------------------------------------------------------------------- +MergeTree compact +test1 insert +test1 select +\N +\N +\N +0 +1 +2 +str_0 +str_1 +str_2 +lc_str_0 +lc_str_1 +lc_str_2 +(0,1) +(1,2) +(2,3) +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +str_1 +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +lc_str_1 +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) 
+(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(1,2) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +----------------------------------------------------------------------------------------------------------- +test1 select +\N +\N +\N +0 +1 +2 +str_0 +str_1 +str_2 +lc_str_0 +lc_str_1 +lc_str_2 +(0,1) +(1,2) +(2,3) +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +str_1 +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +lc_str_1 +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(1,2) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +----------------------------------------------------------------------------------------------------------- +test2 insert +test2 select +\N +\N +\N +0 +\N +2 +str_0 +\N +str_2 +lc_str_0 +\N +lc_str_2 +(0,1) +\N +(2,3) +[0] +\N +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +\N +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +\N +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(0,0) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +----------------------------------------------------------------------------------------------------------- +test2 select +\N +\N +\N +0 +\N +2 +str_0 +\N +str_2 +lc_str_0 +\N +lc_str_2 +(0,1) +\N +(2,3) +[0] +\N +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +\N +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +\N +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(0,0) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +----------------------------------------------------------------------------------------------------------- +test3 insert +test3 select +\N +str_1 +2 +lc_str_3 +(4,5) +[0,1,2,3,4,5] +\N +str_7 +8 +lc_str_9 +(10,11) +[0,1,2,3,4,5,6,7,8,9,10,11] +\N +str_13 +14 +lc_str_15 +(16,17) +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +str_1 +\N +\N +\N +\N +\N +str_7 +\N +\N +\N +\N +\N +str_13 +\N +\N +\N +\N +\N +\N +2 +\N +\N +\N +\N +\N +8 +\N +\N +\N +\N +\N +14 +\N +\N +\N +\N +\N +\N +lc_str_3 +\N +\N +\N +\N 
+\N +lc_str_9 +\N +\N +\N +\N +\N +lc_str_15 +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(4,5) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(10,11) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(16,17) +(0,0) +\N +\N +\N +\N +4 +\N +\N +\N +\N +\N +10 +\N +\N +\N +\N +\N +16 +\N +\N +\N +\N +\N +5 +\N +\N +\N +\N +\N +11 +\N +\N +\N +\N +\N +17 +\N +[] +[] +[] +[] +[] +[0,1,2,3,4,5] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +\N +\N +\N +\N +6 +\N +\N +\N +\N +\N +12 +\N +\N +\N +\N +\N +18 +----------------------------------------------------------------------------------------------------------- +test3 select +\N +str_1 +2 +lc_str_3 +(4,5) +[0,1,2,3,4,5] +\N +str_7 +8 +lc_str_9 +(10,11) +[0,1,2,3,4,5,6,7,8,9,10,11] +\N +str_13 +14 +lc_str_15 +(16,17) +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +str_1 +\N +\N +\N +\N +\N +str_7 +\N +\N +\N +\N +\N +str_13 +\N +\N +\N +\N +\N +\N +2 +\N +\N +\N +\N +\N +8 +\N +\N +\N +\N +\N +14 +\N +\N +\N +\N +\N +\N +lc_str_3 +\N +\N +\N +\N +\N +lc_str_9 +\N +\N +\N +\N +\N +lc_str_15 +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(4,5) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(10,11) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(16,17) +(0,0) +\N +\N +\N +\N +4 +\N +\N +\N +\N +\N +10 +\N +\N +\N +\N +\N +16 +\N +\N +\N +\N +\N +5 +\N +\N +\N +\N +\N +11 +\N +\N +\N +\N +\N +17 +\N +[] +[] +[] +[] +[] +[0,1,2,3,4,5] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +\N +\N +\N +\N +6 +\N +\N +\N +\N +\N +12 +\N +\N +\N +\N +\N +18 +----------------------------------------------------------------------------------------------------------- +MergeTree wide +test1 insert +test1 select +\N +\N +\N +0 +1 +2 +str_0 +str_1 +str_2 +lc_str_0 +lc_str_1 +lc_str_2 +(0,1) +(1,2) +(2,3) +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +str_1 +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +lc_str_1 +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(1,2) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +----------------------------------------------------------------------------------------------------------- +test1 select +\N +\N +\N +0 +1 +2 +str_0 +str_1 +str_2 +lc_str_0 +lc_str_1 +lc_str_2 +(0,1) +(1,2) +(2,3) +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +str_1 +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +lc_str_1 +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(1,2) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +1 +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[0,1] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +2 +3 +----------------------------------------------------------------------------------------------------------- +test2 insert +test2 select +\N +\N 
+\N +0 +\N +2 +str_0 +\N +str_2 +lc_str_0 +\N +lc_str_2 +(0,1) +\N +(2,3) +[0] +\N +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +\N +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +\N +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(0,0) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +----------------------------------------------------------------------------------------------------------- +test2 select +\N +\N +\N +0 +\N +2 +str_0 +\N +str_2 +lc_str_0 +\N +lc_str_2 +(0,1) +\N +(2,3) +[0] +\N +[0,1,2] +\N +\N +\N +\N +\N +\N +str_0 +\N +str_2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +lc_str_0 +\N +lc_str_2 +\N +\N +\N +\N +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(0,1) +(0,0) +(2,3) +(0,0) +(0,0) +(0,0) +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[] +[0,1,2] +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +\N +1 +\N +3 +----------------------------------------------------------------------------------------------------------- +test3 insert +test3 select +\N +str_1 +2 +lc_str_3 +(4,5) +[0,1,2,3,4,5] +\N +str_7 +8 +lc_str_9 +(10,11) +[0,1,2,3,4,5,6,7,8,9,10,11] +\N +str_13 +14 +lc_str_15 +(16,17) +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +str_1 +\N +\N +\N +\N +\N +str_7 +\N +\N +\N +\N +\N +str_13 +\N +\N +\N +\N +\N +\N +2 +\N +\N +\N +\N +\N +8 +\N +\N +\N +\N +\N +14 +\N +\N +\N +\N +\N +\N +lc_str_3 +\N +\N +\N +\N +\N +lc_str_9 +\N +\N +\N +\N +\N +lc_str_15 +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(4,5) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(10,11) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(16,17) +(0,0) +\N +\N +\N +\N +4 +\N +\N +\N +\N +\N +10 +\N +\N +\N +\N +\N +16 +\N +\N +\N +\N +\N +5 +\N +\N +\N +\N +\N +11 +\N +\N +\N +\N +\N +17 +\N +[] +[] +[] +[] +[] +[0,1,2,3,4,5] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +\N +\N +\N +\N +6 +\N +\N +\N +\N +\N +12 +\N +\N +\N +\N +\N +18 +----------------------------------------------------------------------------------------------------------- +test3 select +\N +str_1 +2 +lc_str_3 +(4,5) +[0,1,2,3,4,5] +\N +str_7 +8 +lc_str_9 +(10,11) +[0,1,2,3,4,5,6,7,8,9,10,11] +\N +str_13 +14 +lc_str_15 +(16,17) +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +str_1 +\N +\N +\N +\N +\N +str_7 +\N +\N +\N +\N +\N +str_13 +\N +\N +\N +\N +\N +\N +2 +\N +\N +\N +\N +\N +8 +\N +\N +\N +\N +\N +14 +\N +\N +\N +\N +\N +\N +lc_str_3 +\N +\N +\N +\N +\N +lc_str_9 +\N +\N +\N +\N +\N +lc_str_15 +\N +\N +(0,0) +(0,0) +(0,0) +(0,0) +(4,5) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(10,11) +(0,0) +(0,0) +(0,0) +(0,0) +(0,0) +(16,17) +(0,0) +\N +\N +\N +\N +4 +\N +\N +\N +\N +\N +10 +\N +\N +\N +\N +\N +16 +\N +\N +\N +\N +\N +5 +\N +\N +\N +\N +\N +11 +\N +\N +\N +\N +\N +17 +\N +[] +[] +[] +[] +[] +[0,1,2,3,4,5] +[] +[] +[] +[] 
+[] +[0,1,2,3,4,5,6,7,8,9,10,11] +[] +[] +[] +[] +[] +[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17] +\N +\N +\N +\N +\N +6 +\N +\N +\N +\N +\N +12 +\N +\N +\N +\N +\N +18 +----------------------------------------------------------------------------------------------------------- diff --git a/tests/queries/0_stateless/02941_variant_type_1.sh b/tests/queries/0_stateless/02941_variant_type_1.sh new file mode 100755 index 00000000000..774acb4bbef --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_1.sh @@ -0,0 +1,124 @@ +#!/usr/bin/env bash + +CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# reset --log_comment +CLICKHOUSE_LOG_COMMENT= +# shellcheck source=../shell_config.sh +. "$CUR_DIR"/../shell_config.sh + +CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1" + +function test1_insert() +{ + echo "test1 insert" + $CH_CLIENT -q "insert into test select number, NULL from numbers(3);" + $CH_CLIENT -q "insert into test select number + 3, number from numbers(3);" + $CH_CLIENT -q "insert into test select number + 6, 'str_' || toString(number) from numbers(3);" + $CH_CLIENT -q "insert into test select number + 9, ('lc_str_' || toString(number))::LowCardinality(String) from numbers(3);" + $CH_CLIENT -q "insert into test select number + 12, tuple(number, number + 1)::Tuple(a UInt32, b UInt32) from numbers(3);" + $CH_CLIENT -q "insert into test select number + 15, range(number + 1)::Array(UInt64) from numbers(3);" +} + +function test1_select() +{ + echo "test1 select" + $CH_CLIENT -q "select v from test order by id;" + $CH_CLIENT -q "select v.String from test order by id;" + $CH_CLIENT -q "select v.UInt64 from test order by id;" + $CH_CLIENT -q "select v.\`LowCardinality(String)\` from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\` from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.a from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.b from test order by id;" + $CH_CLIENT -q "select v.\`Array(UInt64)\` from test order by id;" + $CH_CLIENT -q "select v.\`Array(UInt64)\`.size0 from test order by id;" + echo "-----------------------------------------------------------------------------------------------------------" +} + +function test2_insert() +{ + echo "test2 insert" + $CH_CLIENT -q "insert into test select number, NULL from numbers(3);" + $CH_CLIENT -q "insert into test select number + 3, number % 2 ? NULL : number from numbers(3);" + $CH_CLIENT -q "insert into test select number + 6, number % 2 ? NULL : 'str_' || toString(number) from numbers(3);" + $CH_CLIENT -q "insert into test select number + 9, number % 2 ? CAST(NULL, 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') : CAST(('lc_str_' || toString(number))::LowCardinality(String), 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') from numbers(3);" + $CH_CLIENT -q "insert into test select number + 12, number % 2 ? CAST(NULL, 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') : CAST(tuple(number, number + 1)::Tuple(a UInt32, b UInt32), 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') from numbers(3);" + $CH_CLIENT -q "insert into test select number + 15, number % 2 ? 
CAST(NULL, 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') : CAST(range(number + 1)::Array(UInt64), 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') from numbers(3);" +} + +function test2_select() +{ + echo "test2 select" + $CH_CLIENT -q "select v from test order by id;" + $CH_CLIENT -q "select v.String from test order by id;" + $CH_CLIENT -q "select v.UInt64 from test order by id;" + $CH_CLIENT -q "select v.\`LowCardinality(String)\` from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\` from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.a from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.b from test order by id;" + $CH_CLIENT -q "select v.\`Array(UInt64)\` from test order by id;" + $CH_CLIENT -q "select v.\`Array(UInt64)\`.size0 from test order by id;" + echo "-----------------------------------------------------------------------------------------------------------" +} + +function test3_insert() +{ + echo "test3 insert" + $CH_CLIENT -q "insert into test with 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))' as type select number, multiIf(number % 6 == 0, CAST(NULL, type), number % 6 == 1, CAST('str_' || toString(number), type), number % 6 == 2, CAST(number, type), number % 6 == 3, CAST(('lc_str_' || toString(number))::LowCardinality(String), type), number % 6 == 4, CAST(tuple(number, number + 1)::Tuple(a UInt32, b UInt32), type), CAST(range(number + 1)::Array(UInt64), type)) as res from numbers(18);" +} + +function test3_select() +{ + echo "test3 select" + $CH_CLIENT -q "select v from test order by id;" + $CH_CLIENT -q "select v.String from test order by id;" + $CH_CLIENT -q "select v.UInt64 from test order by id;" + $CH_CLIENT -q "select v.\`LowCardinality(String)\` from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\` from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.a from test order by id;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.b from test order by id;" + $CH_CLIENT -q "select v.\`Array(UInt64)\` from test order by id;" + $CH_CLIENT -q "select v.\`Array(UInt64)\`.size0 from test order by id;" + echo "-----------------------------------------------------------------------------------------------------------" +} + +function run() +{ + test1_insert + test1_select + if [ $1 == 1 ]; then + $CH_CLIENT -q "optimize table test final;" + test1_select + fi + $CH_CLIENT -q "truncate table test;" + test2_insert + test2_select + if [ $1 == 1 ]; then + $CH_CLIENT -q "optimize table test final;" + test2_select + fi + $CH_CLIENT -q "truncate table test;" + test3_insert + test3_select + if [ $1 == 1 ]; then + $CH_CLIENT -q "optimize table test final;" + test3_select + fi + $CH_CLIENT -q "truncate table test;" +} + +$CH_CLIENT -q "drop table if exists test;" + +echo "Memory" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=Memory;" +run 0 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree compact" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=100000000, min_bytes_for_wide_part=1000000000;" +run 1 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree wide" +$CH_CLIENT -q 
"create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" +run 1 +$CH_CLIENT -q "drop table test;" diff --git a/tests/queries/0_stateless/02941_variant_type_2.reference b/tests/queries/0_stateless/02941_variant_type_2.reference new file mode 100644 index 00000000000..4b6d53c52ac --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_2.reference @@ -0,0 +1,51 @@ +Memory +test4 insert +test4 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +MergeTree compact +test4 insert +test4 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +test4 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +MergeTree wide +test4 insert +test4 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +test4 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 diff --git a/tests/queries/0_stateless/02941_variant_type_2.sh b/tests/queries/0_stateless/02941_variant_type_2.sh new file mode 100755 index 00000000000..aef5bc3fe02 --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_2.sh @@ -0,0 +1,71 @@ +#!/usr/bin/env bash +# tags: long + +CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# reset --log_comment +CLICKHOUSE_LOG_COMMENT= +# shellcheck source=../shell_config.sh +. "$CUR_DIR"/../shell_config.sh + +CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1" + +function test4_insert() +{ + echo "test4 insert" + $CH_CLIENT -q "insert into test select number, NULL from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 200000, number from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 400000, 'str_' || toString(number) from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 600000, ('lc_str_' || toString(number))::LowCardinality(String) from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 800000, tuple(number, number + 1)::Tuple(a UInt32, b UInt32) from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 1000000, range(number % 20 + 1)::Array(UInt64) from numbers(200000);" +} + +function test4_select +{ + echo "test4 select" + $CH_CLIENT -q "select v from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v);" + $CH_CLIENT -q "select v.String from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.String);" + $CH_CLIENT -q "select v.UInt64 from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.UInt64);" + $CH_CLIENT -q "select v.\`LowCardinality(String)\` from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`LowCardinality(String)\`);" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\` from test format Null;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.a from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`Tuple(a UInt32, b UInt32)\`.a);" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.b from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`Tuple(a UInt32, b UInt32)\`.b);" + $CH_CLIENT -q "select v.\`Array(UInt64)\` from test format Null;" + $CH_CLIENT -q "select count() from test where not empty(v.\`Array(UInt64)\`);" + $CH_CLIENT -q "select v.\`Array(UInt64)\`.size0 from test format Null;" + $CH_CLIENT -q "select count() from test 
where isNotNull(v.\`Array(UInt64)\`.size0);" +} + +function run() +{ + test4_insert + test4_select + if [ $1 == 1 ]; then + $CH_CLIENT -q "optimize table test final;" + test4_select + fi + $CH_CLIENT -q "truncate table test;" +} + +$CH_CLIENT -q "drop table if exists test;" + +echo "Memory" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=Memory;" +run 0 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree compact" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=100000000, min_bytes_for_wide_part=1000000000;" +run 1 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree wide" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" +run 1 +$CH_CLIENT -q "drop table test;" diff --git a/tests/queries/0_stateless/02941_variant_type_3.reference b/tests/queries/0_stateless/02941_variant_type_3.reference new file mode 100644 index 00000000000..1ccdb3acdff --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_3.reference @@ -0,0 +1,51 @@ +Memory +test5 insert +test5 select +500000 +100000 +100000 +100000 +100000 +100000 +100000 +100000 +MergeTree compact +test5 insert +test5 select +500000 +100000 +100000 +100000 +100000 +100000 +100000 +100000 +test5 select +500000 +100000 +100000 +100000 +100000 +100000 +100000 +100000 +MergeTree wide +test5 insert +test5 select +500000 +100000 +100000 +100000 +100000 +100000 +100000 +100000 +test5 select +500000 +100000 +100000 +100000 +100000 +100000 +100000 +100000 diff --git a/tests/queries/0_stateless/02941_variant_type_3.sh b/tests/queries/0_stateless/02941_variant_type_3.sh new file mode 100755 index 00000000000..d3692270deb --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_3.sh @@ -0,0 +1,71 @@ +#!/usr/bin/env bash +# tags: long + +CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# reset --log_comment +CLICKHOUSE_LOG_COMMENT= +# shellcheck source=../shell_config.sh +. "$CUR_DIR"/../shell_config.sh + +CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1" + +function test5_insert() +{ + echo "test5 insert" + $CH_CLIENT -q "insert into test select number, NULL from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 200000, number % 2 ? NULL : number from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 400000, number % 2 ? NULL : 'str_' || toString(number) from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 600000, number % 2 ? CAST(NULL, 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') : CAST(('lc_str_' || toString(number))::LowCardinality(String), 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 800000, number % 2 ? CAST(NULL, 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') : CAST(tuple(number, number + 1)::Tuple(a UInt32, b UInt32), 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') from numbers(200000);" + $CH_CLIENT -q "insert into test select number + 1000000, number % 2 ? 
CAST(NULL, 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') : CAST(range(number % 20 + 1)::Array(UInt64), 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))') from numbers(200000);" +} + +function test5_select() +{ + echo "test5 select" + $CH_CLIENT -q "select v from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v);" + $CH_CLIENT -q "select v.String from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.String);" + $CH_CLIENT -q "select v.UInt64 from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.UInt64);" + $CH_CLIENT -q "select v.\`LowCardinality(String)\` from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`LowCardinality(String)\`);" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\` from test format Null;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.a from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`Tuple(a UInt32, b UInt32)\`.a);" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.b from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`Tuple(a UInt32, b UInt32)\`.b);" + $CH_CLIENT -q "select v.\`Array(UInt64)\` from test format Null;" + $CH_CLIENT -q "select count() from test where not empty(v.\`Array(UInt64)\`);" + $CH_CLIENT -q "select v.\`Array(UInt64)\`.size0 from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`Array(UInt64)\`.size0);" +} + +function run() +{ + test5_insert + test5_select + if [ $1 == 1 ]; then + $CH_CLIENT -q "optimize table test final;" + test5_select + fi + $CH_CLIENT -q "truncate table test;" +} + +$CH_CLIENT -q "drop table if exists test;" + +echo "Memory" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=Memory;" +run 0 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree compact" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=100000000, min_bytes_for_wide_part=1000000000;" +run 1 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree wide" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" +run 1 +$CH_CLIENT -q "drop table test;" diff --git a/tests/queries/0_stateless/02941_variant_type_4.reference b/tests/queries/0_stateless/02941_variant_type_4.reference new file mode 100644 index 00000000000..e13d5820343 --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_4.reference @@ -0,0 +1,56 @@ +Memory +test6 insert +test6 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +----------------------------------------------------------------------------------------------------------- +MergeTree compact +test6 insert +test6 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +----------------------------------------------------------------------------------------------------------- +test6 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +----------------------------------------------------------------------------------------------------------- 
+MergeTree wide +test6 insert +test6 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +----------------------------------------------------------------------------------------------------------- +test6 select +1000000 +200000 +200000 +200000 +200000 +200000 +200000 +200000 +----------------------------------------------------------------------------------------------------------- diff --git a/tests/queries/0_stateless/02941_variant_type_4.sh b/tests/queries/0_stateless/02941_variant_type_4.sh new file mode 100755 index 00000000000..b3cc041bcd8 --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_4.sh @@ -0,0 +1,66 @@ +#!/usr/bin/env bash + +CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# reset --log_comment +CLICKHOUSE_LOG_COMMENT= +# shellcheck source=../shell_config.sh +. "$CUR_DIR"/../shell_config.sh + +CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1" + +function test6_insert() +{ + echo "test6 insert" + $CH_CLIENT -q "insert into test with 'Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))' as type select number, multiIf(number % 6 == 0, CAST(NULL, type), number % 6 == 1, CAST('str_' || toString(number), type), number % 6 == 2, CAST(number, type), number % 6 == 3, CAST(('lc_str_' || toString(number))::LowCardinality(String), type), number % 6 == 4, CAST(tuple(number, number + 1)::Tuple(a UInt32, b UInt32), type), CAST(range(number % 20 + 1)::Array(UInt64), type)) as res from numbers(1200000);" +} + +function test6_select() +{ + echo "test6 select" + $CH_CLIENT -q "select v from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v);" + $CH_CLIENT -q "select v.String from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.String);" + $CH_CLIENT -q "select v.UInt64 from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.UInt64);" + $CH_CLIENT -q "select v.\`LowCardinality(String)\` from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`LowCardinality(String)\`);" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\` from test format Null;" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.a from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`Tuple(a UInt32, b UInt32)\`.a);" + $CH_CLIENT -q "select v.\`Tuple(a UInt32, b UInt32)\`.b from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`Tuple(a UInt32, b UInt32)\`.b);" + $CH_CLIENT -q "select v.\`Array(UInt64)\` from test format Null;" + $CH_CLIENT -q "select count() from test where not empty(v.\`Array(UInt64)\`);" + $CH_CLIENT -q "select v.\`Array(UInt64)\`.size0 from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.\`Array(UInt64)\`.size0);" + echo "-----------------------------------------------------------------------------------------------------------" +} + +function run() +{ + test6_insert + test6_select + if [ $1 == 1 ]; then + $CH_CLIENT -q "optimize table test final;" + test6_select + fi + $CH_CLIENT -q "truncate table test;" +} + +$CH_CLIENT -q "drop table if exists test;" + +echo "Memory" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=Memory;" +run 0 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree compact" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a 
UInt32, b UInt32), Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=100000000, min_bytes_for_wide_part=1000000000;" +run 1 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree wide" +$CH_CLIENT -q "create table test (id UInt64, v Variant(String, UInt64, LowCardinality(String), Tuple(a UInt32, b UInt32), Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" +run 1 +$CH_CLIENT -q "drop table test;" diff --git a/tests/queries/0_stateless/02942_variant_cast.reference b/tests/queries/0_stateless/02942_variant_cast.reference new file mode 100644 index 00000000000..f3fd7a9ba33 --- /dev/null +++ b/tests/queries/0_stateless/02942_variant_cast.reference @@ -0,0 +1,25 @@ +\N +42 +0 +\N +2 +\N +Hello +Hello +NULL +Hello +Hello +\N +Hello +\N +0 +\N +42 +\N +Hello +2 +\N +Hello +5 +0 +1 diff --git a/tests/queries/0_stateless/02942_variant_cast.sql b/tests/queries/0_stateless/02942_variant_cast.sql new file mode 100644 index 00000000000..33587e3e438 --- /dev/null +++ b/tests/queries/0_stateless/02942_variant_cast.sql @@ -0,0 +1,23 @@ +set allow_experimental_variant_type=1; + +select NULL::Variant(String, UInt64); +select 42::UInt64::Variant(String, UInt64); +select 42::UInt32::Variant(String, UInt64); -- {serverError CANNOT_CONVERT_TYPE} +select now()::Variant(String, UInt64); -- {serverError CANNOT_CONVERT_TYPE} +select CAST(number % 2 ? NULL : number, 'Variant(String, UInt64)') from numbers(4); +select 'Hello'::LowCardinality(String)::Variant(LowCardinality(String), UInt64); +select 'Hello'::LowCardinality(Nullable(String))::Variant(LowCardinality(String), UInt64); +select 'NULL'::LowCardinality(Nullable(String))::Variant(LowCardinality(String), UInt64); +select 'Hello'::LowCardinality(Nullable(String))::Variant(LowCardinality(String), UInt64); +select CAST(CAST(number % 2 ? 
NULL : 'Hello', 'LowCardinality(Nullable(String))'), 'Variant(LowCardinality(String), UInt64)') from numbers(4); + +select NULL::Variant(String, UInt64)::UInt64; +select NULL::Variant(String, UInt64)::Nullable(UInt64); +select '42'::Variant(String, UInt64)::UInt64; +select 'str'::Variant(String, UInt64)::UInt64; -- {serverError CANNOT_PARSE_TEXT} +select CAST(multiIf(number % 3 == 0, NULL::Variant(String, UInt64), number % 3 == 1, 'Hello'::Variant(String, UInt64), number::Variant(String, UInt64)), 'Nullable(String)') from numbers(6); +select CAST(multiIf(number == 1, NULL::Variant(String, UInt64), number == 2, 'Hello'::Variant(String, UInt64), number::Variant(String, UInt64)), 'UInt64') from numbers(6); -- {serverError CANNOT_PARSE_TEXT} + + +select number::Variant(UInt64)::Variant(String, UInt64)::Variant(Array(String), String, UInt64) from numbers(2); +select 'str'::Variant(String, UInt64)::Variant(String, Array(UInt64)); -- {serverError CANNOT_CONVERT_TYPE} diff --git a/tests/queries/0_stateless/02943_variant_element.reference b/tests/queries/0_stateless/02943_variant_element.reference new file mode 100644 index 00000000000..ab8aaa8fdef --- /dev/null +++ b/tests/queries/0_stateless/02943_variant_element.reference @@ -0,0 +1,44 @@ +\N +\N +\N +\N +0 +1 +2 +3 +\N +\N +\N +\N +0 +\N +2 +\N +\N +\N +\N +\N +str_0 +\N +str_2 +\N +\N +\N +\N +\N +[] +[] +[] +[] +[] +[] +[] +[] +[0] +[] +[0,1,2] +[] +[[0]] +[[NULL]] +[[2]] +[[NULL]] diff --git a/tests/queries/0_stateless/02943_variant_element.sql b/tests/queries/0_stateless/02943_variant_element.sql new file mode 100644 index 00000000000..c8eff9775ad --- /dev/null +++ b/tests/queries/0_stateless/02943_variant_element.sql @@ -0,0 +1,16 @@ +set allow_experimental_variant_type=1; +set use_variant_when_no_common_type_in_if=1; + +select variantElement(NULL::Variant(String, UInt64), 'UInt64') from numbers(4); +select variantElement(number::Variant(String, UInt64), 'UInt64') from numbers(4); +select variantElement(number::Variant(String, UInt64), 'String') from numbers(4); +select variantElement((number % 2 ? NULL : number)::Variant(String, UInt64), 'UInt64') from numbers(4); +select variantElement((number % 2 ? NULL : number)::Variant(String, UInt64), 'String') from numbers(4); +select variantElement((number % 2 ? NULL : 'str_' || toString(number))::LowCardinality(Nullable(String))::Variant(LowCardinality(String), UInt64), 'LowCardinality(String)') from numbers(4); +select variantElement(NULL::LowCardinality(Nullable(String))::Variant(LowCardinality(String), UInt64), 'LowCardinality(String)') from numbers(4); +select variantElement((number % 2 ? NULL : number)::Variant(Array(UInt64), UInt64), 'Array(UInt64)') from numbers(4); +select variantElement(NULL::Variant(Array(UInt64), UInt64), 'Array(UInt64)') from numbers(4); +select variantElement(number % 2 ? NULL : range(number + 1), 'Array(UInt64)') from numbers(4); + +select variantElement([[(number % 2 ? 
NULL : number)::Variant(String, UInt64)]], 'UInt64') from numbers(4); + diff --git a/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.reference b/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.reference new file mode 100644 index 00000000000..3803f39253c --- /dev/null +++ b/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.reference @@ -0,0 +1,96 @@ +Array(UInt8) [1,2,3] +Array(UInt8) [1,2,3] +String str_1 +Nullable(String) str_1 +String str_1 +Nullable(String) str_1 +Variant(Array(UInt8), String) str_1 +Variant(Array(UInt8), String) str_1 +Array(UInt8) [1,2,3] +Array(UInt8) [1,2,3] +String str_1 +Nullable(String) str_1 +String str_1 +Nullable(String) str_1 +Variant(Array(UInt8), String) str_1 +Variant(Array(UInt8), String) str_1 +Array(UInt8) [1,2,3] +Array(UInt8) [1,2,3] +String str_1 +Nullable(String) str_1 +String str_1 +Nullable(String) str_1 +Variant(Array(UInt8), String) str_1 +Variant(Array(UInt8), String) str_1 +String str_0 +String str_1 +String str_2 +String str_3 +Nullable(String) str_0 +Nullable(String) str_1 +Nullable(String) str_2 +Nullable(String) str_3 +Array(UInt64) [0] +Array(UInt64) [0,1] +Array(UInt64) [0,1,2] +Array(UInt64) [0,1,2,3] +Array(UInt64) [0] +Array(UInt64) [0,1] +Array(UInt64) [0,1,2] +Array(UInt64) [0,1,2,3] +String str_0 +String str_1 +String str_2 +String str_3 +Nullable(String) str_0 +Nullable(String) str_1 +Nullable(String) str_2 +Nullable(String) str_3 +Variant(Array(UInt64), String) str_0 +Variant(Array(UInt64), String) str_1 +Variant(Array(UInt64), String) str_2 +Variant(Array(UInt64), String) str_3 +Variant(Array(UInt64), String) str_0 +Variant(Array(UInt64), String) str_1 +Variant(Array(UInt64), String) str_2 +Variant(Array(UInt64), String) str_3 +Variant(Array(UInt64), String) str_0 +Variant(Array(UInt64), String) [0,1] +Variant(Array(UInt64), String) str_2 +Variant(Array(UInt64), String) [0,1,2,3] +Variant(Array(UInt64), String) str_0 +Variant(Array(UInt64), String) [0,1] +Variant(Array(UInt64), String) str_2 +Variant(Array(UInt64), String) [0,1,2,3] +Variant(Array(UInt64), String) str_0 +Variant(Array(UInt64), String) [0,1] +Variant(Array(UInt64), String) str_2 +Variant(Array(UInt64), String) [0,1,2,3] +Variant(Array(UInt64), String) str_0 +Variant(Array(UInt64), String) [0,1] +Variant(Array(UInt64), String) str_2 +Variant(Array(UInt64), String) [0,1,2,3] +Variant(Array(UInt64), String, UInt64) [0] +Variant(Array(UInt64), String, UInt64) 1 +Variant(Array(UInt64), String, UInt64) str_2 +Variant(Array(UInt64), String, UInt64) [0,1,2,3] +Variant(Array(UInt64), String, UInt64) 4 +Variant(Array(UInt64), String, UInt64) str_5 +Variant(Array(UInt64), String, UInt64) [0] +Variant(Array(UInt64), String, UInt64) 1 +Variant(Array(UInt64), String, UInt64) str_2 +Variant(Array(UInt64), String, UInt64) [0,1,2,3] +Variant(Array(UInt64), String, UInt64) 4 +Variant(Array(UInt64), String, UInt64) str_5 +Variant(Array(UInt64), String, UInt64) [0] +Variant(Array(UInt64), String, UInt64) 1 +Variant(Array(UInt64), String, UInt64) str_2 +Variant(Array(UInt64), String, UInt64) [0,1,2,3] +Variant(Array(UInt64), String, UInt64) 4 +Variant(Array(UInt64), String, UInt64) str_5 +Variant(Array(UInt64), String, UInt64) [0] +Variant(Array(UInt64), String, UInt64) 1 +Variant(Array(UInt64), String, UInt64) str_2 +Variant(Array(UInt64), String, UInt64) [0,1,2,3] +Variant(Array(UInt64), String, UInt64) 4 +Variant(Array(UInt64), String, UInt64) str_5 diff --git a/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.sql 
b/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.sql new file mode 100644 index 00000000000..da36863bfda --- /dev/null +++ b/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.sql @@ -0,0 +1,64 @@ +set allow_experimental_variant_type=1; +set use_variant_when_no_common_type_in_if=1; + +select toTypeName(res), if(1, [1,2,3], 'str_1') as res; +select toTypeName(res), if(1, [1,2,3], 'str_1'::Nullable(String)) as res; + +select toTypeName(res), if(0, [1,2,3], 'str_1') as res; +select toTypeName(res), if(0, [1,2,3], 'str_1'::Nullable(String)) as res; + +select toTypeName(res), if(NULL, [1,2,3], 'str_1') as res; +select toTypeName(res), if(NULL, [1,2,3], 'str_1'::Nullable(String)) as res; + +select toTypeName(res), if(materialize(NULL::Nullable(UInt8)), [1,2,3], 'str_1') as res; +select toTypeName(res), if(materialize(NULL::Nullable(UInt8)), [1,2,3], 'str_1'::Nullable(String)) as res; + +select toTypeName(res), if(1, materialize([1,2,3]), 'str_1') as res; +select toTypeName(res), if(1, materialize([1,2,3]), 'str_1'::Nullable(String)) as res; + +select toTypeName(res), if(0, materialize([1,2,3]), 'str_1') as res; +select toTypeName(res), if(0, materialize([1,2,3]), 'str_1'::Nullable(String)) as res; + +select toTypeName(res), if(NULL, materialize([1,2,3]), 'str_1') as res; +select toTypeName(res), if(NULL, materialize([1,2,3]), 'str_1'::Nullable(String)) as res; + +select toTypeName(res), if(materialize(NULL::Nullable(UInt8)), materialize([1,2,3]), 'str_1') as res; +select toTypeName(res), if(materialize(NULL::Nullable(UInt8)), materialize([1,2,3]), 'str_1'::Nullable(String)) as res; + +select toTypeName(res), if(1, [1,2,3], materialize('str_1')) as res; +select toTypeName(res), if(1, [1,2,3], materialize('str_1')::Nullable(String)) as res; + +select toTypeName(res), if(0, [1,2,3], materialize('str_1')) as res; +select toTypeName(res), if(0, [1,2,3], materialize('str_1')::Nullable(String)) as res; + +select toTypeName(res), if(NULL, [1,2,3], materialize('str_1')) as res; +select toTypeName(res), if(NULL, [1,2,3], materialize('str_1')::Nullable(String)) as res; + +select toTypeName(res), if(materialize(NULL::Nullable(UInt8)), [1,2,3], materialize('str_1')) as res; +select toTypeName(res), if(materialize(NULL::Nullable(UInt8)), [1,2,3], materialize('str_1')::Nullable(String)) as res; + + +select toTypeName(res), if(0, range(number + 1), 'str_' || toString(number)) as res from numbers(4); +select toTypeName(res), if(0, range(number + 1), ('str_' || toString(number))::Nullable(String)) as res from numbers(4); + +select toTypeName(res), if(1, range(number + 1), 'str_' || toString(number)) as res from numbers(4); +select toTypeName(res), if(1, range(number + 1), ('str_' || toString(number))::Nullable(String)) as res from numbers(4); + +select toTypeName(res), if(NULL, range(number + 1), 'str_' || toString(number)) as res from numbers(4); +select toTypeName(res), if(NULL, range(number + 1), ('str_' || toString(number))::Nullable(String)) as res from numbers(4); + +select toTypeName(res), if(materialize(NULL::Nullable(UInt8)), range(number + 1), 'str_' || toString(number)) as res from numbers(4); +select toTypeName(res), if(materialize(NULL::Nullable(UInt8)), range(number + 1), ('str_' || toString(number))::Nullable(String)) as res from numbers(4); + +select toTypeName(res), if(number % 2, range(number + 1), 'str_' || toString(number)) as res from numbers(4); +select toTypeName(res), if(number % 2, range(number + 1), ('str_' || toString(number))::Nullable(String)) as res from 
numbers(4); + +select toTypeName(res), if(number % 2, range(number + 1), ('str_' || toString(number))::LowCardinality(String)) as res from numbers(4); +select toTypeName(res), if(number % 2, range(number + 1), ('str_' || toString(number))::LowCardinality(Nullable(String))) as res from numbers(4); + + +select toTypeName(res), multiIf(number % 3 == 0, range(number + 1), number % 3 == 1, number, 'str_' || toString(number)) as res from numbers(6); +select toTypeName(res), multiIf(number % 3 == 0, range(number + 1), number % 3 == 1, number, ('str_' || toString(number))::Nullable(String)) as res from numbers(6); +select toTypeName(res), multiIf(number % 3 == 0, range(number + 1), number % 3 == 1, number, ('str_' || toString(number))::LowCardinality(String)) as res from numbers(6); +select toTypeName(res), multiIf(number % 3 == 0, range(number + 1), number % 3 == 1, number, ('str_' || toString(number))::LowCardinality(Nullable(String))) as res from numbers(6); + From 0a7ca36e7fbd02b4b64a30371fa3118144179e51 Mon Sep 17 00:00:00 2001 From: avogar Date: Tue, 19 Dec 2023 17:08:35 +0000 Subject: [PATCH 0055/1081] Remove unneded changes in IColumn.h --- src/Columns/IColumn.h | 11 ----------- 1 file changed, 11 deletions(-) diff --git a/src/Columns/IColumn.h b/src/Columns/IColumn.h index 0dcba5b310c..3f866e6213d 100644 --- a/src/Columns/IColumn.h +++ b/src/Columns/IColumn.h @@ -631,17 +631,6 @@ struct IsMutableColumns template <> struct IsMutableColumns<> { static const bool value = true; }; -template -struct IsMutableColumnsOrRvalueReferences; - -template -struct IsMutableColumnsOrRvalueReferences -{ - static const bool value = (std::is_assignable::value || std::is_rvalue_reference_v) && IsMutableColumnsOrRvalueReferences::value; -}; - -template <> -struct IsMutableColumnsOrRvalueReferences<> { static const bool value = true; }; template const Type * checkAndGetColumn(const IColumn & column) From bd84799aecb0f8103fd88e9fb1491720f9ec90c8 Mon Sep 17 00:00:00 2001 From: avogar Date: Tue, 19 Dec 2023 17:21:45 +0000 Subject: [PATCH 0056/1081] Fix style --- src/Columns/ColumnVariant.h | 4 ++-- utils/check-style/aspell-ignore/en/aspell-dict.txt | 1 + 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/src/Columns/ColumnVariant.h b/src/Columns/ColumnVariant.h index 692fdd1709e..702107504f0 100644 --- a/src/Columns/ColumnVariant.h +++ b/src/Columns/ColumnVariant.h @@ -9,7 +9,7 @@ namespace DB namespace ErrorCodes { - extern const int LOGICAL_ERROR; + extern const int NOT_IMPLEMENTED; } /** @@ -263,7 +263,7 @@ public: bool hasOnlyNulls() const { /// If all variants are empty, we have only NULL values. - return std::all_of(variants.begin(), variants.end(), [](const auto & v){ return v->empty(); } ); + return std::all_of(variants.begin(), variants.end(), [](const WrappedPtr & v){ return v->empty(); }); } /// Check if local and global order is the same. 
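
A minimal standalone sketch of the behaviour the new 02943/02944 tests above pin down (illustrative only, not part of any patch hunk; it assumes a server built with these changes and reuses the experimental settings the tests themselves enable — result types for constant branches can differ under the analyzer, as a later commit in this series notes):

set allow_experimental_variant_type = 1;
set use_variant_when_no_common_type_in_if = 1;

-- if() with no common type between the branches now returns a Variant instead of throwing
select toTypeName(res), if(number % 2, range(number + 1), 'str_' || toString(number)) as res from numbers(4);

-- a single variant can be pulled out with variantElement; rows holding another variant come back as NULL (or [] for array variants)
select variantElement(if(number % 2, range(number + 1), 'str_' || toString(number)), 'String') from numbers(4);
select variantElement(if(number % 2, range(number + 1), 'str_' || toString(number)), 'Array(UInt64)') from numbers(4);
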
diff --git a/utils/check-style/aspell-ignore/en/aspell-dict.txt b/utils/check-style/aspell-ignore/en/aspell-dict.txt index 637ab0ce6d4..bc03f4b39f8 100644 --- a/utils/check-style/aspell-ignore/en/aspell-dict.txt +++ b/utils/check-style/aspell-ignore/en/aspell-dict.txt @@ -2594,6 +2594,7 @@ uuid varPop varSamp variadic +variantElement varint varpop varsamp From e74ae96dd006f8ff5fc8150eba5ab0beb47ddba3 Mon Sep 17 00:00:00 2001 From: avogar Date: Tue, 19 Dec 2023 17:35:13 +0000 Subject: [PATCH 0057/1081] Fux typo --- src/DataTypes/Serializations/SerializationNullable.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/DataTypes/Serializations/SerializationNullable.cpp b/src/DataTypes/Serializations/SerializationNullable.cpp index e7f0e61f2a5..05c70827c35 100644 --- a/src/DataTypes/Serializations/SerializationNullable.cpp +++ b/src/DataTypes/Serializations/SerializationNullable.cpp @@ -206,7 +206,7 @@ ReturnType safeAppendToNullMap(ColumnNullable & column, bool is_null) } /// Deserialize value into non-nullable column. In case of NULL, insert default and set is_null to true. -/// If ReturnType is bool, return true if parsing was succesfull and false in case of any error. +/// If ReturnType is bool, return true if parsing was successful and false in case of any error. template static ReturnType deserializeImpl(IColumn & column, ReadBuffer & buf, CheckForNull && check_for_null, DeserializeNested && deserialize_nested, bool & is_null) { From 9edbfb3a31e67722a6af3b418a119e9b2bbb164e Mon Sep 17 00:00:00 2001 From: avogar Date: Tue, 19 Dec 2023 17:55:42 +0000 Subject: [PATCH 0058/1081] Fix build after merging with master --- src/DataTypes/Serializations/SerializationEnum.cpp | 10 +++++----- src/DataTypes/Serializations/SerializationEnum.h | 2 +- 2 files changed, 6 insertions(+), 6 deletions(-) diff --git a/src/DataTypes/Serializations/SerializationEnum.cpp b/src/DataTypes/Serializations/SerializationEnum.cpp index 6ad55913738..fb384547d64 100644 --- a/src/DataTypes/Serializations/SerializationEnum.cpp +++ b/src/DataTypes/Serializations/SerializationEnum.cpp @@ -47,7 +47,7 @@ bool SerializationEnum::tryDeserializeTextEscaped(IColumn & column, ReadBu { std::string field_name; readEscapedString(field_name, istr); - if (!this->tryGetValue(x, StringRef(field_name), true)) + if (!ref_enum_values.tryGetValue(x, StringRef(field_name), true)) return false; } @@ -75,7 +75,7 @@ bool SerializationEnum::tryDeserializeTextQuoted(IColumn & column, ReadBuf std::string field_name; readQuotedStringWithSQLStyle(field_name, istr); FieldType x; - if (!this->tryGetValue(x, StringRef(field_name))) + if (!ref_enum_values.tryGetValue(x, StringRef(field_name))) return false; assert_cast(column).getData().push_back(x); return true; @@ -111,7 +111,7 @@ bool SerializationEnum::tryDeserializeWholeText(IColumn & column, ReadBuff { std::string field_name; readStringUntilEOF(field_name, istr); - if (!this->tryGetValue(x, StringRef(field_name), true)) + if (!ref_enum_values.tryGetValue(x, StringRef(field_name), true)) return false; } @@ -157,7 +157,7 @@ bool SerializationEnum::tryDeserializeTextJSON(IColumn & column, ReadBuffe { std::string field_name; readJSONString(field_name, istr); - if (!this->tryGetValue(x, StringRef(field_name))) + if (!ref_enum_values.tryGetValue(x, StringRef(field_name))) return false; } @@ -198,7 +198,7 @@ bool SerializationEnum::tryDeserializeTextCSV(IColumn & column, ReadBuffer { std::string field_name; readCSVString(field_name, istr, settings.csv); - if (!this->tryGetValue(x, 
StringRef(field_name), true)) + if (!ref_enum_values.tryGetValue(x, StringRef(field_name), true)) return false; } diff --git a/src/DataTypes/Serializations/SerializationEnum.h b/src/DataTypes/Serializations/SerializationEnum.h index 708161dc5fd..5152a3fbc93 100644 --- a/src/DataTypes/Serializations/SerializationEnum.h +++ b/src/DataTypes/Serializations/SerializationEnum.h @@ -60,7 +60,7 @@ public: bool tryReadValue(ReadBuffer & istr, FieldType & x) const { - if (!tryReadText(x, istr) || !this->hasValue(x)) + if (!tryReadText(x, istr) || !ref_enum_values.hasValue(x)) return false; return true; From 3c9dd07f7b2c036f5d299869f16ae0a39621b25f Mon Sep 17 00:00:00 2001 From: avogar Date: Tue, 19 Dec 2023 21:17:39 +0000 Subject: [PATCH 0059/1081] Fix special builds, fix test --- src/Columns/tests/gtest_column_variant.cpp | 5 ++++- src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp | 7 +++---- tests/queries/0_stateless/02941_variant_type_1.sh | 1 + tests/queries/0_stateless/02941_variant_type_2.sh | 2 +- tests/queries/0_stateless/02941_variant_type_3.sh | 2 +- tests/queries/0_stateless/02941_variant_type_4.sh | 1 + 6 files changed, 11 insertions(+), 7 deletions(-) diff --git a/src/Columns/tests/gtest_column_variant.cpp b/src/Columns/tests/gtest_column_variant.cpp index b701e2d3183..0a6512c46b7 100644 --- a/src/Columns/tests/gtest_column_variant.cpp +++ b/src/Columns/tests/gtest_column_variant.cpp @@ -582,7 +582,10 @@ TEST(ColumnVariant, PermuteAndIndexOneColumnNoNulls) ASSERT_EQ((*permuted_column)[2].get(), 2); auto index = ColumnUInt64::create(); - index->getData() = std::move(permutation); + index->getData().push_back(1); + index->getData().push_back(3); + index->getData().push_back(2); + index->getData().push_back(0); auto indexed_column = column->index(*index, 3); ASSERT_EQ(indexed_column->size(), 3); ASSERT_EQ((*indexed_column)[0].get(), 1); diff --git a/src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp b/src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp index 81c4af97401..dfcd24aff58 100644 --- a/src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp +++ b/src/DataTypes/Serializations/SerializationIPv4andIPv6.cpp @@ -15,10 +15,10 @@ void SerializationIP::deserializeText(DB::IColumn & column, DB::ReadBuffer IPv x; readText(x, istr); + assert_cast &>(column).getData().push_back(x); + if (whole && !istr.eof()) throwUnexpectedDataAfterParsedValue(column, istr, settings, TypeName.data()); - - assert_cast &>(column).getData().push_back(x); } template @@ -77,11 +77,10 @@ void SerializationIP::deserializeTextJSON(DB::IColumn & column, DB::ReadBuf /// this code looks weird, but we want to throw specific exception to match original behavior... 
if (istr.eof()) assertChar('"', istr); + assert_cast &>(column).getData().push_back(x); if (*istr.position() != '"') throwUnexpectedDataAfterParsedValue(column, istr, settings, TypeName.data()); istr.ignore(); - - assert_cast &>(column).getData().push_back(x); } template diff --git a/tests/queries/0_stateless/02941_variant_type_1.sh b/tests/queries/0_stateless/02941_variant_type_1.sh index 774acb4bbef..4cf8ad25122 100755 --- a/tests/queries/0_stateless/02941_variant_type_1.sh +++ b/tests/queries/0_stateless/02941_variant_type_1.sh @@ -1,4 +1,5 @@ #!/usr/bin/env bash +# Tags: long CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # reset --log_comment diff --git a/tests/queries/0_stateless/02941_variant_type_2.sh b/tests/queries/0_stateless/02941_variant_type_2.sh index aef5bc3fe02..7064dfbf4ec 100755 --- a/tests/queries/0_stateless/02941_variant_type_2.sh +++ b/tests/queries/0_stateless/02941_variant_type_2.sh @@ -1,5 +1,5 @@ #!/usr/bin/env bash -# tags: long +# Tags: long CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # reset --log_comment diff --git a/tests/queries/0_stateless/02941_variant_type_3.sh b/tests/queries/0_stateless/02941_variant_type_3.sh index d3692270deb..303039edef7 100755 --- a/tests/queries/0_stateless/02941_variant_type_3.sh +++ b/tests/queries/0_stateless/02941_variant_type_3.sh @@ -1,5 +1,5 @@ #!/usr/bin/env bash -# tags: long +# Tags: long CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # reset --log_comment diff --git a/tests/queries/0_stateless/02941_variant_type_4.sh b/tests/queries/0_stateless/02941_variant_type_4.sh index b3cc041bcd8..169e43c6d69 100755 --- a/tests/queries/0_stateless/02941_variant_type_4.sh +++ b/tests/queries/0_stateless/02941_variant_type_4.sh @@ -1,4 +1,5 @@ #!/usr/bin/env bash +# Tags: long CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # reset --log_comment From e832599dfab7ba2304a4a00175ce48f6a63ed701 Mon Sep 17 00:00:00 2001 From: Duc Canh Le Date: Wed, 20 Dec 2023 04:57:56 +0000 Subject: [PATCH 0060/1081] fix materialize column for compact parts Signed-off-by: Duc Canh Le --- src/Storages/MergeTree/MutateTask.cpp | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index a04d9cdb886..dd84aa0d98a 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -80,7 +80,11 @@ static void splitAndModifyMutationCommands( /// So we only mutated column if `command.column_name` is a materialized column or if the part does not have physical column file auto column_ordinary = table_columns.getOrdinary().tryGetByName(command.column_name); if (!column_ordinary || !part->tryGetColumn(command.column_name) || !part->hasColumnFiles(*column_ordinary)) + { + LOG_DEBUG(log, "Materializing column {}\n", command.column_name); + for_interpreter.push_back(command); mutated_columns.emplace(command.column_name); + } } if (command.type == MutationCommand::Type::MATERIALIZE_INDEX || command.type == MutationCommand::Type::MATERIALIZE_STATISTIC @@ -92,7 +96,6 @@ static void splitAndModifyMutationCommands( for_interpreter.push_back(command); for (const auto & [column_name, expr] : command.column_to_update_expression) mutated_columns.emplace(column_name); - } else if (command.type == MutationCommand::Type::DROP_INDEX || command.type == MutationCommand::Type::DROP_PROJECTION From 7b49a0e530e2a2cb8629c249b96f43c6554ea51d Mon Sep 17 00:00:00 2001 From: Duc Canh Le Date: Wed, 20 Dec 2023 04:59:03 +0000 Subject: [PATCH 
0061/1081] remove junk log Signed-off-by: Duc Canh Le --- src/Storages/MergeTree/MutateTask.cpp | 1 - 1 file changed, 1 deletion(-) diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index dd84aa0d98a..bb41608eb00 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -81,7 +81,6 @@ static void splitAndModifyMutationCommands( auto column_ordinary = table_columns.getOrdinary().tryGetByName(command.column_name); if (!column_ordinary || !part->tryGetColumn(command.column_name) || !part->hasColumnFiles(*column_ordinary)) { - LOG_DEBUG(log, "Materializing column {}\n", command.column_name); for_interpreter.push_back(command); mutated_columns.emplace(command.column_name); } From 1efd65b8c73951e60e94f74ccc45141a5b39d85e Mon Sep 17 00:00:00 2001 From: avogar Date: Wed, 20 Dec 2023 17:43:04 +0000 Subject: [PATCH 0062/1081] Fix tests --- src/Columns/ColumnVariant.cpp | 10 ++++++++++ src/Columns/ColumnVariant.h | 1 + src/DataTypes/DataTypeVariant.cpp | 12 ++++++++++++ src/DataTypes/DataTypeVariant.h | 1 + src/DataTypes/IDataType.h | 2 +- .../Serializations/SerializationVariantElement.cpp | 2 +- 6 files changed, 26 insertions(+), 2 deletions(-) diff --git a/src/Columns/ColumnVariant.cpp b/src/Columns/ColumnVariant.cpp index 67754e77992..a3a0362b646 100644 --- a/src/Columns/ColumnVariant.cpp +++ b/src/Columns/ColumnVariant.cpp @@ -480,6 +480,16 @@ void ColumnVariant::insertFrom(const IColumn & src_, size_t n) } } +void ColumnVariant::insertIntoVariant(const DB::Field & x, Discriminator global_discr) +{ + if (global_discr > variants.size()) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Invalid global discriminator: {}. The number of variants is {}", size_t(global_discr), variants.size()); + auto & variant = getVariantByGlobalDiscriminator(global_discr); + variant.insert(x); + getLocalDiscriminators().push_back(localDiscriminatorByGlobal(global_discr)); + getOffsets().push_back(variant.size() - 1); +} + void ColumnVariant::insertRangeFrom(const IColumn & src_, size_t start, size_t length) { const size_t num_variants = variants.size(); diff --git a/src/Columns/ColumnVariant.h b/src/Columns/ColumnVariant.h index 702107504f0..b388b118a69 100644 --- a/src/Columns/ColumnVariant.h +++ b/src/Columns/ColumnVariant.h @@ -174,6 +174,7 @@ public: StringRef getDataAt(size_t n) const override; void insertData(const char * pos, size_t length) override; void insert(const Field & x) override; + void insertIntoVariant(const Field & x, Discriminator global_discr); void insertFrom(const IColumn & src_, size_t n) override; void insertRangeFrom(const IColumn & src, size_t start, size_t length) override; void insertManyFrom(const IColumn & src, size_t position, size_t length) override; diff --git a/src/DataTypes/DataTypeVariant.cpp b/src/DataTypes/DataTypeVariant.cpp index 77e1c504cf8..334ed2c7b10 100644 --- a/src/DataTypes/DataTypeVariant.cpp +++ b/src/DataTypes/DataTypeVariant.cpp @@ -1,9 +1,11 @@ #include +#include #include #include #include #include #include +#include #include #include #include @@ -94,6 +96,16 @@ MutableColumnPtr DataTypeVariant::createColumn() const return ColumnVariant::create(std::move(nested_columns)); } +ColumnPtr DataTypeVariant::createColumnConst(size_t size, const DB::Field & field) const +{ + auto field_type = applyVisitor(FieldToDataType(), field); + auto discr = tryGetVariantDiscriminator(field_type); + if (!discr) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Cannot insert field \"{}\" into column with type {}", 
toString(field), getName()); + auto column = createColumn(); + assert_cast(*column).insertIntoVariant(field, *discr); + return ColumnConst::create(std::move(column), size); +} Field DataTypeVariant::getDefault() const { diff --git a/src/DataTypes/DataTypeVariant.h b/src/DataTypes/DataTypeVariant.h index 60113a188b0..ca15dff1476 100644 --- a/src/DataTypes/DataTypeVariant.h +++ b/src/DataTypes/DataTypeVariant.h @@ -37,6 +37,7 @@ public: MutableColumnPtr createColumn() const override; + ColumnPtr createColumnConst(size_t size, const Field & field) const override; Field getDefault() const override; bool equals(const IDataType & rhs) const override; diff --git a/src/DataTypes/IDataType.h b/src/DataTypes/IDataType.h index ccdf54f57c3..4533c23a89f 100644 --- a/src/DataTypes/IDataType.h +++ b/src/DataTypes/IDataType.h @@ -150,7 +150,7 @@ public: /** Create ColumnConst for corresponding type, with specified size and value. */ - ColumnPtr createColumnConst(size_t size, const Field & field) const; + virtual ColumnPtr createColumnConst(size_t size, const Field & field) const; ColumnPtr createColumnConstWithDefaultValue(size_t size) const; /** Get default value of data type. diff --git a/src/DataTypes/Serializations/SerializationVariantElement.cpp b/src/DataTypes/Serializations/SerializationVariantElement.cpp index 4b24ee5754e..1c0808db2a0 100644 --- a/src/DataTypes/Serializations/SerializationVariantElement.cpp +++ b/src/DataTypes/Serializations/SerializationVariantElement.cpp @@ -204,7 +204,7 @@ ColumnPtr SerializationVariantElement::VariantSubcolumnCreator::create(const DB: /// If this variant is empty, fill result column with default values. if (prev->empty()) { - auto res = IColumn::mutate(makeNullableOrLowCardinalityNullableSafe(prev)); + auto res = makeNullableOrLowCardinalityNullableSafe(prev)->cloneEmpty(); res->insertManyDefaults(local_discriminators->size()); return res; } From 4f8789927db4dd0d9c79a80bebc805895d82297c Mon Sep 17 00:00:00 2001 From: avogar Date: Thu, 21 Dec 2023 15:53:21 +0000 Subject: [PATCH 0063/1081] Fix tests with analyzer, add more tests --- src/DataTypes/DataTypeVariant.cpp | 18 +- ...different_local_and_global_order.reference | 244 ++++++++++++++++++ ...e_with_different_local_and_global_order.sh | 82 ++++++ .../02944_variant_as_if_multi_if_result.sql | 1 + 4 files changed, 340 insertions(+), 5 deletions(-) create mode 100644 tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference create mode 100755 tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh diff --git a/src/DataTypes/DataTypeVariant.cpp b/src/DataTypes/DataTypeVariant.cpp index 334ed2c7b10..0575f220f22 100644 --- a/src/DataTypes/DataTypeVariant.cpp +++ b/src/DataTypes/DataTypeVariant.cpp @@ -98,12 +98,20 @@ MutableColumnPtr DataTypeVariant::createColumn() const ColumnPtr DataTypeVariant::createColumnConst(size_t size, const DB::Field & field) const { - auto field_type = applyVisitor(FieldToDataType(), field); - auto discr = tryGetVariantDiscriminator(field_type); - if (!discr) - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Cannot insert field \"{}\" into column with type {}", toString(field), getName()); auto column = createColumn(); - assert_cast(*column).insertIntoVariant(field, *discr); + if (field.isNull()) + { + column->insertDefault(); + } + else + { + auto field_type = applyVisitor(FieldToDataType(), field); + auto discr = tryGetVariantDiscriminator(field_type); + if (!discr) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Cannot insert 
field \"{}\" into column with type {}", toString(field), getName()); + assert_cast(*column).insertIntoVariant(field, *discr); + } + return ColumnConst::create(std::move(column), size); } diff --git a/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference new file mode 100644 index 00000000000..f2e355824f9 --- /dev/null +++ b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference @@ -0,0 +1,244 @@ +Memory +test1 insert +test1 select +0 \N 0 +1 \N 1 +2 \N 2 +3 \N 3 +4 \N 4 +5 \N 5 +6 \N 6 +7 \N 7 +8 \N 8 +9 \N 9 +10 \N 10 +\N \N \N +12 \N 12 +\N \N \N +14 \N 14 +\N \N \N +16 \N 16 +\N \N \N +18 \N 18 +\N \N \N +str_20 str_20 \N +\N \N \N +str_22 str_22 \N +\N \N \N +str_24 str_24 \N +\N \N \N +str_26 str_26 \N +\N \N \N +str_28 str_28 \N +\N \N \N +30 \N 30 +\N \N \N +32 \N 32 +\N \N \N +34 \N 34 +\N \N \N +str_36 str_36 \N +\N \N \N +str_38 str_38 \N +\N \N \N +----------------------------------------------------------------------------------------------------------- +test2 insert +test2 select +7000000 +1000000 +6000000 +----------------------------------------------------------------------------------------------------------- +MergeTree compact +test1 insert +test1 select +0 \N 0 +1 \N 1 +2 \N 2 +3 \N 3 +4 \N 4 +5 \N 5 +6 \N 6 +7 \N 7 +8 \N 8 +9 \N 9 +10 \N 10 +\N \N \N +12 \N 12 +\N \N \N +14 \N 14 +\N \N \N +16 \N 16 +\N \N \N +18 \N 18 +\N \N \N +str_20 str_20 \N +\N \N \N +str_22 str_22 \N +\N \N \N +str_24 str_24 \N +\N \N \N +str_26 str_26 \N +\N \N \N +str_28 str_28 \N +\N \N \N +30 \N 30 +\N \N \N +32 \N 32 +\N \N \N +34 \N 34 +\N \N \N +str_36 str_36 \N +\N \N \N +str_38 str_38 \N +\N \N \N +----------------------------------------------------------------------------------------------------------- +test1 select +0 \N 0 +1 \N 1 +2 \N 2 +3 \N 3 +4 \N 4 +5 \N 5 +6 \N 6 +7 \N 7 +8 \N 8 +9 \N 9 +10 \N 10 +\N \N \N +12 \N 12 +\N \N \N +14 \N 14 +\N \N \N +16 \N 16 +\N \N \N +18 \N 18 +\N \N \N +str_20 str_20 \N +\N \N \N +str_22 str_22 \N +\N \N \N +str_24 str_24 \N +\N \N \N +str_26 str_26 \N +\N \N \N +str_28 str_28 \N +\N \N \N +30 \N 30 +\N \N \N +32 \N 32 +\N \N \N +34 \N 34 +\N \N \N +str_36 str_36 \N +\N \N \N +str_38 str_38 \N +\N \N \N +----------------------------------------------------------------------------------------------------------- +test2 insert +test2 select +7000000 +1000000 +6000000 +----------------------------------------------------------------------------------------------------------- +test2 select +7000000 +1000000 +6000000 +----------------------------------------------------------------------------------------------------------- +MergeTree wide +test1 insert +test1 select +0 \N 0 +1 \N 1 +2 \N 2 +3 \N 3 +4 \N 4 +5 \N 5 +6 \N 6 +7 \N 7 +8 \N 8 +9 \N 9 +10 \N 10 +\N \N \N +12 \N 12 +\N \N \N +14 \N 14 +\N \N \N +16 \N 16 +\N \N \N +18 \N 18 +\N \N \N +str_20 str_20 \N +\N \N \N +str_22 str_22 \N +\N \N \N +str_24 str_24 \N +\N \N \N +str_26 str_26 \N +\N \N \N +str_28 str_28 \N +\N \N \N +30 \N 30 +\N \N \N +32 \N 32 +\N \N \N +34 \N 34 +\N \N \N +str_36 str_36 \N +\N \N \N +str_38 str_38 \N +\N \N \N +----------------------------------------------------------------------------------------------------------- +test1 select +0 \N 0 +1 \N 1 +2 \N 2 +3 \N 3 +4 \N 4 +5 \N 5 +6 \N 6 +7 \N 7 +8 \N 8 +9 \N 9 +10 \N 10 +\N \N \N +12 \N 12 +\N \N \N +14 \N 14 +\N \N \N +16 \N 16 +\N \N \N +18 \N 18 
+\N \N \N +str_20 str_20 \N +\N \N \N +str_22 str_22 \N +\N \N \N +str_24 str_24 \N +\N \N \N +str_26 str_26 \N +\N \N \N +str_28 str_28 \N +\N \N \N +30 \N 30 +\N \N \N +32 \N 32 +\N \N \N +34 \N 34 +\N \N \N +str_36 str_36 \N +\N \N \N +str_38 str_38 \N +\N \N \N +----------------------------------------------------------------------------------------------------------- +test2 insert +test2 select +7000000 +1000000 +6000000 +----------------------------------------------------------------------------------------------------------- +test2 select +7000000 +1000000 +6000000 +----------------------------------------------------------------------------------------------------------- diff --git a/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh new file mode 100755 index 00000000000..88bd2d3bd42 --- /dev/null +++ b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh @@ -0,0 +1,82 @@ +#!/usr/bin/env bash + +CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# reset --log_comment +CLICKHOUSE_LOG_COMMENT= +# shellcheck source=../shell_config.sh +. "$CUR_DIR"/../shell_config.sh + +CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1 --use_variant_when_no_common_type_in_if=1 " + + +function test1_insert() +{ + echo "test1 insert" + $CH_CLIENT -q "insert into test select number, number::Variant(UInt64)::Variant(UInt64, Array(UInt64)) from numbers(10) settings max_block_size=3" + $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)) as res from numbers(10, 10) settings max_block_size=3" + $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64)) as res from numbers(20, 10) settings max_block_size=3" + $CH_CLIENT -q "insert into test select number, if(number < 35, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)), if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64))) from numbers(30, 10) settings max_block_size=3" +} + +function test1_select() +{ + echo "test1 select" + $CH_CLIENT -q "select v, v.String, v.UInt64 from test order by id;" + echo "-----------------------------------------------------------------------------------------------------------" +} + +function test2_insert() +{ + echo "test2 insert" + $CH_CLIENT -q "insert into test select number, number::Variant(UInt64)::Variant(UInt64, Array(UInt64)) from numbers(1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" + $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)) as res from numbers(1000000, 10000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" + $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64)) as res from numbers(2000000, 1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" + $CH_CLIENT -q "insert into test select number, if(number < 5, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)), if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64))) from 
numbers(3000000, 1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" + } + +function test2_select() +{ + echo "test2 select" + $CH_CLIENT -q "select v from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v);" + $CH_CLIENT -q "select v.String from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.String);" + $CH_CLIENT -q "select v.UInt64 from test format Null;" + $CH_CLIENT -q "select count() from test where isNotNull(v.UInt64);" + echo "-----------------------------------------------------------------------------------------------------------" +} + +function run() +{ + test1_insert + test1_select + if [ $1 == 1 ]; then + $CH_CLIENT -q "optimize table test final;" + test1_select + fi + $CH_CLIENT -q "truncate table test;" + test2_insert + test2_select + if [ $1 == 1 ]; then + $CH_CLIENT -q "optimize table test final;" + test2_select + fi + $CH_CLIENT -q "truncate table test;" +} + +$CH_CLIENT -q "drop table if exists test;" + +echo "Memory" +$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, String, Array(UInt64))) engine=Memory;" +run 0 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree compact" +$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, String, Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=100000000, min_bytes_for_wide_part=1000000000;" +run 1 +$CH_CLIENT -q "drop table test;" + +echo "MergeTree wide" +$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, String, Array(UInt64))) engine=MergeTree order by id settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" +run 1 +$CH_CLIENT -q "drop table test;" diff --git a/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.sql b/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.sql index da36863bfda..1121b21e383 100644 --- a/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.sql +++ b/tests/queries/0_stateless/02944_variant_as_if_multi_if_result.sql @@ -1,3 +1,4 @@ +set allow_experimental_analyzer=0; -- The result type for if function with constant is different with analyzer. set allow_experimental_variant_type=1; set use_variant_when_no_common_type_in_if=1; From 38ec9b5f719740b4e94758f9e5578acd562df939 Mon Sep 17 00:00:00 2001 From: avogar Date: Fri, 22 Dec 2023 00:11:39 +0000 Subject: [PATCH 0064/1081] Fix variant element deserialization --- .../Serializations/SerializationVariant.cpp | 27 ++-- .../SerializationVariantElement.cpp | 149 ++++++++++-------- ...different_local_and_global_order.reference | 30 ++-- ...e_with_different_local_and_global_order.sh | 8 +- 4 files changed, 117 insertions(+), 97 deletions(-) diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp index ebd44fd6955..910ad1da303 100644 --- a/src/DataTypes/Serializations/SerializationVariant.cpp +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -277,13 +277,10 @@ void SerializationVariant::deserializeBinaryBulkWithMultipleStreams( throw Exception(ErrorCodes::LOGICAL_ERROR, "Trying to deserialize data into Variant column with not global variants order"); /// First, deserialize new discriminators. - /// We deserialize them into a separate column to be able to use substream cache, - /// so if we also need to deserialize some of sub columns, we will read discriminators only once. 
settings.path.push_back(Substream::VariantDiscriminators); - ColumnPtr discriminators; if (auto cached_discriminators = getFromSubstreamsCache(cache, settings.path)) { - discriminators = cached_discriminators; + col.getLocalDiscriminatorsPtr() = cached_discriminators; } else { @@ -291,29 +288,31 @@ void SerializationVariant::deserializeBinaryBulkWithMultipleStreams( if (!discriminators_stream) throw Exception(ErrorCodes::LOGICAL_ERROR, "Got empty stream for VariantDiscriminators in SerializationVariant::deserializeBinaryBulkWithMultipleStreams"); - discriminators = ColumnVariant::ColumnDiscriminators::create(); - SerializationNumber().deserializeBinaryBulk(*discriminators->assumeMutable(), *discriminators_stream, limit, 0); - addToSubstreamsCache(cache, settings.path, discriminators); + SerializationNumber().deserializeBinaryBulk(*col.getLocalDiscriminatorsPtr()->assumeMutable(), *discriminators_stream, limit, 0); + addToSubstreamsCache(cache, settings.path, col.getLocalDiscriminatorsPtr()); } settings.path.pop_back(); - /// Iterate through new discriminators, append them to column and calculate the limit for each variant. + /// Iterate through new discriminators and calculate the limit for each variant. /// While calculating limits we can also fill offsets column (we store offsets only in memory). - const auto & discriminators_data = assert_cast(*discriminators).getData(); - auto & local_discriminators = col.getLocalDiscriminators(); - local_discriminators.reserve(local_discriminators.size() + limit); + auto & discriminators_data = col.getLocalDiscriminators(); auto & offsets = col.getOffsets(); offsets.reserve(offsets.size() + limit); std::vector variant_limits(variants.size(), 0); - for (size_t i = 0; i != limit; ++i) + size_t discriminators_offset = discriminators_data.size() - limit; + for (size_t i = discriminators_offset; i != discriminators_data.size(); ++i) { ColumnVariant::Discriminator discr = discriminators_data[i]; - local_discriminators.push_back(discr); if (discr == ColumnVariant::NULL_DISCRIMINATOR) + { offsets.emplace_back(); + } else - offsets.push_back(col.getVariantByLocalDiscriminator(discr).size() + variant_limits[discr]++); + { + offsets.push_back(col.getVariantByLocalDiscriminator(discr).size() + variant_limits[discr]); + ++variant_limits[discr]; + } } /// Now we can deserialize variants according to their limits. diff --git a/src/DataTypes/Serializations/SerializationVariantElement.cpp b/src/DataTypes/Serializations/SerializationVariantElement.cpp index 1c0808db2a0..e06a20d2990 100644 --- a/src/DataTypes/Serializations/SerializationVariantElement.cpp +++ b/src/DataTypes/Serializations/SerializationVariantElement.cpp @@ -40,11 +40,31 @@ void SerializationVariantElement::serializeBinaryBulkStateSuffix(SerializeBinary ErrorCodes::NOT_IMPLEMENTED, "Method serializeBinaryBulkStateSuffix is not implemented for SerializationVariantElement"); } +struct DeserializeBinaryBulkStateVariantElement : public ISerialization::DeserializeBinaryBulkState +{ + /// During deserialization discriminators and variant streams can be shared. + /// For example we can read several variant elements together: "select v.UInt32, v.String from table", + /// or we can read the whole variant and some of variant elements: "select v, v.UInt32 from table". + /// To read the same column from the same stream more than once we use substream cache, + /// but this cache stores the whole column, not only the current range. 
+ /// During deserialization of variant element discriminators and variant columns are not stored + /// in the result column, so we need to store them inside deserialization state, so we can use + /// substream cache correctly. + ColumnPtr discriminators; + ColumnPtr variant; + + ISerialization::DeserializeBinaryBulkStatePtr variant_element_state; +}; + void SerializationVariantElement::deserializeBinaryBulkStatePrefix(DeserializeBinaryBulkSettings & settings, DeserializeBinaryBulkStatePtr & state) const { + auto variant_element_state = std::make_shared(); + addVariantToPath(settings.path); - nested_serialization->deserializeBinaryBulkStatePrefix(settings, state); + nested_serialization->deserializeBinaryBulkStatePrefix(settings, variant_element_state->variant_element_state); removeVariantFromPath(settings.path); + + state = std::move(variant_element_state); } void SerializationVariantElement::serializeBinaryBulkWithMultipleStreams(const IColumn &, size_t, size_t, SerializeBinaryBulkSettings &, SerializeBinaryBulkStatePtr &) const @@ -53,22 +73,19 @@ void SerializationVariantElement::serializeBinaryBulkWithMultipleStreams(const I } void SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams( - ColumnPtr & column, + ColumnPtr & result_column, size_t limit, DeserializeBinaryBulkSettings & settings, DeserializeBinaryBulkStatePtr & state, SubstreamsCache * cache) const { - auto mutable_column = column->assumeMutable(); - ColumnNullable * nullable_col = typeid_cast(mutable_column.get()); - NullMap * null_map = nullable_col ? &nullable_col->getNullMapData() : nullptr; + auto * variant_element_state = checkAndGetState(state); /// First, deserialize discriminators from Variant column. settings.path.push_back(Substream::VariantDiscriminators); - ColumnPtr discriminators; if (auto cached_discriminators = getFromSubstreamsCache(cache, settings.path)) { - discriminators = cached_discriminators; + variant_element_state->discriminators = cached_discriminators; } else { @@ -76,85 +93,87 @@ void SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams( if (!discriminators_stream) throw Exception(ErrorCodes::LOGICAL_ERROR, "Got empty stream for VariantDiscriminators in SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams"); - discriminators = ColumnVariant::ColumnDiscriminators::create(); - SerializationNumber().deserializeBinaryBulk(*discriminators->assumeMutable(), *discriminators_stream, limit, 0); - addToSubstreamsCache(cache, settings.path, discriminators); + /// If we started to read a new column, reinitialize discriminators column in deserialization state. + if (!variant_element_state->discriminators || result_column->empty()) + variant_element_state->discriminators = ColumnVariant::ColumnDiscriminators::create(); + + SerializationNumber().deserializeBinaryBulk(*variant_element_state->discriminators->assumeMutable(), *discriminators_stream, limit, 0); + addToSubstreamsCache(cache, settings.path, variant_element_state->discriminators); } settings.path.pop_back(); - /// Iterate through discriminators to calculate the size of the variant. - const auto & discriminators_data = assert_cast(*discriminators).getData(); - size_t variant_size = 0; - for (auto discr : discriminators_data) - variant_size += discr == variant_discriminator; + /// Iterate through new discriminators to calculate the limit for our variant. 
+ const auto & discriminators_data = assert_cast(*variant_element_state->discriminators).getData(); + size_t discriminators_offset = variant_element_state->discriminators->size() - limit; + size_t variant_limit = 0; + for (size_t i = discriminators_offset; i != discriminators_data.size(); ++i) + variant_limit += (discriminators_data[i] == variant_discriminator); - /// Now we know the size of the variant and can deserialize it. + /// Now we know the limit for our variant and can deserialize it. - /// If the size of variant column is the same as the size of discriminators, - /// we can deserialize new values directly into our column. - if (variant_size == discriminators_data.size()) + /// If result column is Nullable, fill null map and extract nested column. + MutableColumnPtr mutable_column = result_column->assumeMutable(); + if (isColumnNullable(*mutable_column)) { - addVariantToPath(settings.path); - /// Special case when our result column is LowCardinality(Nullable(T)). - /// In this case the variant type is LowCardinality(T), and we cannot just - /// deserialize its values directly into LowCardinality(Nullable(T)) column. - /// We create a separate column with type LowCardinality(T), deserialize - /// values into it and then insert into result column using insertRangeFrom. - if (isColumnLowCardinalityNullable(*column)) + auto & nullable_column = assert_cast(*mutable_column); + NullMap & null_map = nullable_column.getNullMapData(); + /// If we have only our discriminator in range, fill null map with 0. + if (variant_limit == limit) { - ColumnPtr variant_col = mutable_column->cloneEmpty(); - /// LowCardinality(Nullable(T)) -> LowCardinality(T) - assert_cast(*variant_col->assumeMutable()).nestedRemoveNullable(); - nested_serialization->deserializeBinaryBulkWithMultipleStreams(variant_col, limit, settings, state, cache); - mutable_column->insertRangeFrom(*variant_col, 0, variant_col->size()); + null_map.resize_fill(null_map.size() + limit, 0); } + /// If our discriminator is not in the current range, fill the null map with 1. + else if (variant_limit == 0) + { + null_map.resize_fill(null_map.size() + limit, 1); + } + /// Otherwise we should iterate through discriminators to fill null map. else { - nested_serialization->deserializeBinaryBulkWithMultipleStreams(nullable_col ? nullable_col->getNestedColumnPtr() : column, limit, settings, state, cache); + null_map.reserve(null_map.size() + limit); + for (size_t i = discriminators_offset; i != discriminators_data.size(); ++i) + null_map.push_back(discriminators_data[i] != variant_discriminator); } - if (nullable_col) - null_map->resize_fill(null_map->size() + limit, 0); - removeVariantFromPath(settings.path); - return; + + mutable_column = nullable_column.getNestedColumnPtr()->assumeMutable(); } - /// If variant size is 0, just fill column with default values. - if (variant_size == 0) + /// If we started to read a new column, reinitialize variant column in deserialization state. + if (!variant_element_state->variant || result_column->empty()) { - mutable_column->insertManyDefaults(limit); - return; + variant_element_state->variant = mutable_column->cloneEmpty(); + + /// When result column is LowCardinality(Nullable(T)) we should + /// remove Nullable from variant column before deserialization.
+ if (isColumnLowCardinalityNullable(*mutable_column)) + assert_cast(*variant_element_state->variant->assumeMutable()).nestedRemoveNullable(); } - /// In general case we should deserialize variant into a separate column, - /// iterate through discriminators and insert values from variant only when - /// row contains its discriminator and default value otherwise. - mutable_column->reserve(mutable_column->size() + limit); - mutable_column = nullable_col ? nullable_col->getNestedColumnPtr()->assumeMutable() : std::move(mutable_column); - ColumnPtr variant_col = mutable_column->cloneEmpty(); - - /// Special case when our result column is LowCardinality(Nullable(T)). - /// We should remove Nullable from variant column before deserialization. - if (isColumnLowCardinalityNullable(*column)) - assert_cast(*variant_col->assumeMutable()).nestedRemoveNullable(); - addVariantToPath(settings.path); - nested_serialization->deserializeBinaryBulkWithMultipleStreams(variant_col, variant_size, settings, state, cache); + nested_serialization->deserializeBinaryBulkWithMultipleStreams(variant_element_state->variant, variant_limit, settings, variant_element_state->variant_element_state, cache); removeVariantFromPath(settings.path); - size_t variant_index = 0; - for (auto discr : discriminators_data) + size_t variant_offset = variant_element_state->variant->size() - variant_limit; + + /// If we don't have our discriminator in the range, just insert defaults. + if (variant_limit == 0) { - if (discr == variant_discriminator) + mutable_column->insertManyDefaults(limit); + } + /// If we have only our discriminator in the range, insert the whole range into the result column. + else if (variant_limit == limit) + { + mutable_column->insertRangeFrom(*variant_element_state->variant, variant_offset, variant_limit); + } + /// Otherwise iterate through discriminators and insert value from variant or default value depending on the discriminator.
+ else + { + for (size_t i = discriminators_offset; i != discriminators_data.size(); ++i) { - if (null_map) - null_map->push_back(0); - mutable_column->insertFrom(*variant_col, variant_index++); - } - else - { - if (null_map) - null_map->push_back(1); - mutable_column->insertDefault(); + if (discriminators_data[i] == variant_discriminator) + mutable_column->insertFrom(*variant_element_state->variant, variant_offset++); + else + mutable_column->insertDefault(); } } } diff --git a/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference index f2e355824f9..1736a307c42 100644 --- a/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference +++ b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference @@ -44,9 +44,9 @@ str_38 str_38 \N ----------------------------------------------------------------------------------------------------------- test2 insert test2 select -7000000 -1000000 -6000000 +2500000 +750000 +1750000 ----------------------------------------------------------------------------------------------------------- MergeTree compact test1 insert @@ -136,14 +136,14 @@ str_38 str_38 \N ----------------------------------------------------------------------------------------------------------- test2 insert test2 select -7000000 -1000000 -6000000 +2500000 +750000 +1750000 ----------------------------------------------------------------------------------------------------------- test2 select -7000000 -1000000 -6000000 +2500000 +750000 +1750000 ----------------------------------------------------------------------------------------------------------- MergeTree wide test1 insert @@ -233,12 +233,12 @@ str_38 str_38 \N ----------------------------------------------------------------------------------------------------------- test2 insert test2 select -7000000 -1000000 -6000000 +2500000 +750000 +1750000 ----------------------------------------------------------------------------------------------------------- test2 select -7000000 -1000000 -6000000 +2500000 +750000 +1750000 ----------------------------------------------------------------------------------------------------------- diff --git a/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh index 88bd2d3bd42..9f4df8d7466 100755 --- a/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh +++ b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh @@ -1,4 +1,5 @@ #!/usr/bin/env bash +# Tags: long CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # reset --log_comment @@ -29,14 +30,15 @@ function test2_insert() { echo "test2 insert" $CH_CLIENT -q "insert into test select number, number::Variant(UInt64)::Variant(UInt64, Array(UInt64)) from numbers(1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" - $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)) as res from numbers(1000000, 10000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" + $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)) as res from numbers(1000000, 1000000) settings 
max_insert_block_size = 100000, min_insert_block_size_rows=100000" $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64)) as res from numbers(2000000, 1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" - $CH_CLIENT -q "insert into test select number, if(number < 5, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)), if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64))) from numbers(3000000, 1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" - } + $CH_CLIENT -q "insert into test select number, if(number < 3500000, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)), if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64))) from numbers(3000000, 1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" +} function test2_select() { echo "test2 select" + $CH_CLIENT -q "select v, v.String, v.UInt64 from test format Null;" $CH_CLIENT -q "select v from test format Null;" $CH_CLIENT -q "select count() from test where isNotNull(v);" $CH_CLIENT -q "select v.String from test format Null;" From 319c20091efe8eebee5bde9bb8bae67e58a589d9 Mon Sep 17 00:00:00 2001 From: avogar Date: Fri, 22 Dec 2023 00:15:44 +0000 Subject: [PATCH 0065/1081] Fix comments --- src/DataTypes/Serializations/SerializationVariant.cpp | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp index 910ad1da303..3b51c51872f 100644 --- a/src/DataTypes/Serializations/SerializationVariant.cpp +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -276,7 +276,7 @@ void SerializationVariant::deserializeBinaryBulkWithMultipleStreams( if (!col.hasGlobalVariantsOrder()) throw Exception(ErrorCodes::LOGICAL_ERROR, "Trying to deserialize data into Variant column with not global variants order"); - /// First, deserialize new discriminators. + /// First, deserialize discriminators. settings.path.push_back(Substream::VariantDiscriminators); if (auto cached_discriminators = getFromSubstreamsCache(cache, settings.path)) { @@ -451,7 +451,7 @@ std::unordered_map getTypesTextDeserializePriorityMap() /// then for types with the same depth we sort by the types priority, and last we sort by the depth of LowCardinality/Nullable types, /// so if we have types with the same level of nesting and the same priority, we will first try to deserialize LowCardinality/Nullable types /// (for example if we have types Array(Array(String)) and Array(Array(Nullable(String))). -/// This is just a batch of heuristics, +/// This is just a batch of heuristics. std::tuple getTypeTextDeserializePriority(const DataTypePtr & type, size_t nested_depth, size_t simple_nested_depth, std::unordered_map & priority_map) { if (const auto * nullable_type = typeid_cast(type.get())) @@ -553,7 +553,7 @@ bool SerializationVariant::tryDeserializeImpl( for (size_t global_discr : deserialize_text_order) { ReadBufferFromString variant_buf(field); - /// Usually try_deserialize_variant should not throw an exception, but let's use try/catch just in case. + /// Usually try_deserialize_variant should not throw any exception, but let's use try/catch just in case. 
try { auto & variant_column = column_variant.getVariantByGlobalDiscriminator(global_discr); From a61efedba8854e8f06b549deb595315ee40eb303 Mon Sep 17 00:00:00 2001 From: avogar Date: Sat, 23 Dec 2023 00:10:58 +0000 Subject: [PATCH 0066/1081] Fix serialization again, add more tests --- src/Columns/ColumnVariant.h | 2 +- src/Columns/ColumnVector.cpp | 2 +- src/DataTypes/DataTypeVariant.cpp | 15 +++++- .../Serializations/ISerialization.cpp | 7 +++ src/DataTypes/Serializations/ISerialization.h | 1 + .../Serializations/SerializationVariant.cpp | 52 ++++++++++++++----- .../02943_variant_read_subcolumns_1.reference | 6 +++ .../02943_variant_read_subcolumns_1.sh | 38 ++++++++++++++ .../02943_variant_read_subcolumns_2.reference | 6 +++ .../02943_variant_read_subcolumns_2.sh | 38 ++++++++++++++ 10 files changed, 150 insertions(+), 17 deletions(-) create mode 100644 tests/queries/0_stateless/02943_variant_read_subcolumns_1.reference create mode 100755 tests/queries/0_stateless/02943_variant_read_subcolumns_1.sh create mode 100644 tests/queries/0_stateless/02943_variant_read_subcolumns_2.reference create mode 100755 tests/queries/0_stateless/02943_variant_read_subcolumns_2.sh diff --git a/src/Columns/ColumnVariant.h b/src/Columns/ColumnVariant.h index b388b118a69..ec58553f5f3 100644 --- a/src/Columns/ColumnVariant.h +++ b/src/Columns/ColumnVariant.h @@ -163,7 +163,7 @@ public: size_t size() const override { - return local_discriminators->size(); + return offsets->size(); } Field operator[](size_t n) const override; diff --git a/src/Columns/ColumnVector.cpp b/src/Columns/ColumnVector.cpp index 37e62c76596..b4e3fee5e42 100644 --- a/src/Columns/ColumnVector.cpp +++ b/src/Columns/ColumnVector.cpp @@ -469,7 +469,7 @@ void ColumnVector::insertRangeFrom(const IColumn & src, size_t start, size_t const ColumnVector & src_vec = assert_cast(src); if (start + length > src_vec.data.size()) - throw Exception(ErrorCodes::PARAMETER_OUT_OF_BOUND, + throw Exception(ErrorCodes::LOGICAL_ERROR, "Parameters start = {}, length = {} are out of bound " "in ColumnVector::insertRangeFrom method (data.size() = {}).", toString(start), toString(length), toString(src_vec.data.size())); diff --git a/src/DataTypes/DataTypeVariant.cpp b/src/DataTypes/DataTypeVariant.cpp index 0575f220f22..5dc42cc7443 100644 --- a/src/DataTypes/DataTypeVariant.cpp +++ b/src/DataTypes/DataTypeVariant.cpp @@ -108,7 +108,20 @@ ColumnPtr DataTypeVariant::createColumnConst(size_t size, const DB::Field & fiel auto field_type = applyVisitor(FieldToDataType(), field); auto discr = tryGetVariantDiscriminator(field_type); if (!discr) - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Cannot insert field \"{}\" into column with type {}", toString(field), getName()); + { + for (size_t i = 0; i != variants.size(); ++i) + { + if (field.getType() == variants[i]->getDefault().getType()) + { + discr = i; + break; + } + } + } + + if (!discr) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Cannot insert field \"{}\" with type {} into column with type {}", toString(field), field.getTypeName(), getName()); + assert_cast(*column).insertIntoVariant(field, *discr); } diff --git a/src/DataTypes/Serializations/ISerialization.cpp b/src/DataTypes/Serializations/ISerialization.cpp index 86a37949dc8..46353fffb48 100644 --- a/src/DataTypes/Serializations/ISerialization.cpp +++ b/src/DataTypes/Serializations/ISerialization.cpp @@ -124,15 +124,20 @@ void ISerialization::deserializeBinaryBulkWithMultipleStreams( DeserializeBinaryBulkStatePtr & /* state */, SubstreamsCache * cache) const { + 
LOG_DEBUG(&Poco::Logger::get("ISerialization"), "Deserialize path {}. Initial column size: {}", settings.path.toString(), column->size()); + auto cached_column = getFromSubstreamsCache(cache, settings.path); if (cached_column) { column = cached_column; + LOG_DEBUG(&Poco::Logger::get("ISerialization"), "Use column from cache. Size: {}", cached_column->size()); } else if (ReadBuffer * stream = settings.getter(settings.path)) { auto mutable_column = column->assumeMutable(); + LOG_DEBUG(&Poco::Logger::get("ISerialization"), "Deserialize column. Initial size: {}", mutable_column->size()); deserializeBinaryBulk(*mutable_column, *stream, limit, settings.avg_value_size_hint); + LOG_DEBUG(&Poco::Logger::get("ISerialization"), "Deserialized column. Size: {}", mutable_column->size()); column = std::move(mutable_column); addToSubstreamsCache(cache, settings.path, column); } @@ -177,6 +182,8 @@ String getNameForSubstreamPath( } else if (it->type == Substream::VariantDiscriminators) stream_name += ".discr"; + else if (it->type == Substream::VariantOffsets) + stream_name += ".variant_offsets"; else if (it->type == Substream::VariantElement) stream_name += "." + it->variant_element_name; } diff --git a/src/DataTypes/Serializations/ISerialization.h b/src/DataTypes/Serializations/ISerialization.h index f0273f59d1f..5c6fe31ed9e 100644 --- a/src/DataTypes/Serializations/ISerialization.h +++ b/src/DataTypes/Serializations/ISerialization.h @@ -153,6 +153,7 @@ public: ObjectData, VariantDiscriminators, + VariantOffsets, VariantElements, VariantElement, diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp index 3b51c51872f..d36151fe8e9 100644 --- a/src/DataTypes/Serializations/SerializationVariant.cpp +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -291,28 +291,17 @@ void SerializationVariant::deserializeBinaryBulkWithMultipleStreams( SerializationNumber().deserializeBinaryBulk(*col.getLocalDiscriminatorsPtr()->assumeMutable(), *discriminators_stream, limit, 0); addToSubstreamsCache(cache, settings.path, col.getLocalDiscriminatorsPtr()); } - settings.path.pop_back(); - /// Iterate through new discriminators and calculate the limit for each variant. - /// While calculating limits we can also fill offsets column (we store offsets only in memory). - auto & discriminators_data = col.getLocalDiscriminators(); - auto & offsets = col.getOffsets(); - offsets.reserve(offsets.size() + limit); + /// Second, calculate limits for each variant by iterating through new discriminators. std::vector variant_limits(variants.size(), 0); + auto & discriminators_data = col.getLocalDiscriminators(); size_t discriminators_offset = discriminators_data.size() - limit; for (size_t i = discriminators_offset; i != discriminators_data.size(); ++i) { ColumnVariant::Discriminator discr = discriminators_data[i]; - if (discr == ColumnVariant::NULL_DISCRIMINATOR) - { - offsets.emplace_back(); - } - else - { - offsets.push_back(col.getVariantByLocalDiscriminator(discr).size() + variant_limits[discr]); + if (discr != ColumnVariant::NULL_DISCRIMINATOR) ++variant_limits[discr]; - } } /// Now we can deserialize variants according to their limits. @@ -325,6 +314,41 @@ void SerializationVariant::deserializeBinaryBulkWithMultipleStreams( settings.path.pop_back(); } settings.path.pop_back(); + + /// Fill offsets column. 
+ /// It's important to do it after deserialization of all variants, because to fill offsets we need + /// initial variant sizes without values in current range, but some variants can be shared with + /// other columns via substream cache and they can already contain values from this range even + /// before we call deserialize for them. So, before deserialization we cannot know for sure if + /// variant columns already contain values from current range or not. But after calling deserialize + /// we know for sure that they contain these values, so we can use variant limits and their + /// new sizes to calculate correct offsets. + settings.path.push_back(Substream::VariantOffsets); + if (auto cached_offsets = getFromSubstreamsCache(cache, settings.path)) + { + col.getOffsetsPtr() = cached_offsets; + } + else + { + auto & offsets = col.getOffsets(); + offsets.reserve(offsets.size() + limit); + std::vector variant_offsets; + variant_offsets.reserve(variants.size()); + for (size_t i = 0; i != variants.size(); ++i) + variant_offsets.push_back(col.getVariantByLocalDiscriminator(i).size() - variant_limits[i]); + + for (size_t i = discriminators_offset; i != discriminators_data.size(); ++i) + { + ColumnVariant::Discriminator discr = discriminators_data[i]; + if (discr == ColumnVariant::NULL_DISCRIMINATOR) + offsets.emplace_back(); + else + offsets.push_back(variant_offsets[discr]++); + } + + addToSubstreamsCache(cache, settings.path, col.getOffsetsPtr()); + } + settings.path.pop_back(); } void SerializationVariant::addVariantElementToPath(DB::ISerialization::SubstreamPath & path, size_t i) const diff --git a/tests/queries/0_stateless/02943_variant_read_subcolumns_1.reference b/tests/queries/0_stateless/02943_variant_read_subcolumns_1.reference new file mode 100644 index 00000000000..4b93782cddf --- /dev/null +++ b/tests/queries/0_stateless/02943_variant_read_subcolumns_1.reference @@ -0,0 +1,6 @@ +Memory +test +MergeTree compact +test +MergeTree wide +test diff --git a/tests/queries/0_stateless/02943_variant_read_subcolumns_1.sh b/tests/queries/0_stateless/02943_variant_read_subcolumns_1.sh new file mode 100755 index 00000000000..9ccad55191f --- /dev/null +++ b/tests/queries/0_stateless/02943_variant_read_subcolumns_1.sh @@ -0,0 +1,38 @@ +#!/usr/bin/env bash +# Tags: long + +CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# reset --log_comment +CLICKHOUSE_LOG_COMMENT= +# shellcheck source=../shell_config.sh +. 
"$CUR_DIR"/../shell_config.sh + +CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1 --use_variant_when_no_common_type_in_if=1 " + + +function test() +{ + echo "test" + $CH_CLIENT -q "insert into test select number, multiIf(number % 3 == 2, NULL, number % 3 == 1, number, arrayMap(x -> multiIf(number % 9 == 0, NULL, number % 9 == 3, 'str_' || toString(number), number), range(number % 10))) from numbers(1000000) settings min_insert_block_size_rows=100000" + $CH_CLIENT -q "select v, v.UInt64, v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64 from test order by id format Null" + $CH_CLIENT -q "select v.UInt64, v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64 from test order by id format Null" + $CH_CLIENT -q "select v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64, v.\`Array(Variant(String, UInt64))\`.String from test order by id format Null" +} + +$CH_CLIENT -q "drop table if exists test;" + +echo "Memory" +$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=Memory" +test +$CH_CLIENT -q "drop table test;" + +echo "MergeTree compact" +$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=MergeTree order by id settings min_rows_for_wide_part=1000000000, min_bytes_for_wide_part=10000000000;" +test +$CH_CLIENT -q "drop table test;" + +echo "MergeTree wide" +$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=MergeTree order by id settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" +test +$CH_CLIENT -q "drop table test;" + diff --git a/tests/queries/0_stateless/02943_variant_read_subcolumns_2.reference b/tests/queries/0_stateless/02943_variant_read_subcolumns_2.reference new file mode 100644 index 00000000000..4b93782cddf --- /dev/null +++ b/tests/queries/0_stateless/02943_variant_read_subcolumns_2.reference @@ -0,0 +1,6 @@ +Memory +test +MergeTree compact +test +MergeTree wide +test diff --git a/tests/queries/0_stateless/02943_variant_read_subcolumns_2.sh b/tests/queries/0_stateless/02943_variant_read_subcolumns_2.sh new file mode 100755 index 00000000000..9ccad55191f --- /dev/null +++ b/tests/queries/0_stateless/02943_variant_read_subcolumns_2.sh @@ -0,0 +1,38 @@ +#!/usr/bin/env bash +# Tags: long + +CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# reset --log_comment +CLICKHOUSE_LOG_COMMENT= +# shellcheck source=../shell_config.sh +. 
"$CUR_DIR"/../shell_config.sh + +CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1 --use_variant_when_no_common_type_in_if=1 " + + +function test() +{ + echo "test" + $CH_CLIENT -q "insert into test select number, multiIf(number % 3 == 2, NULL, number % 3 == 1, number, arrayMap(x -> multiIf(number % 9 == 0, NULL, number % 9 == 3, 'str_' || toString(number), number), range(number % 10))) from numbers(1000000) settings min_insert_block_size_rows=100000" + $CH_CLIENT -q "select v, v.UInt64, v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64 from test order by id format Null" + $CH_CLIENT -q "select v.UInt64, v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64 from test order by id format Null" + $CH_CLIENT -q "select v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64, v.\`Array(Variant(String, UInt64))\`.String from test order by id format Null" +} + +$CH_CLIENT -q "drop table if exists test;" + +echo "Memory" +$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=Memory" +test +$CH_CLIENT -q "drop table test;" + +echo "MergeTree compact" +$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=MergeTree order by id settings min_rows_for_wide_part=1000000000, min_bytes_for_wide_part=10000000000;" +test +$CH_CLIENT -q "drop table test;" + +echo "MergeTree wide" +$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=MergeTree order by id settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" +test +$CH_CLIENT -q "drop table test;" + From 4931b363079aa5dd4fbc35ff6faea62efaf218de Mon Sep 17 00:00:00 2001 From: avogar Date: Sat, 23 Dec 2023 00:32:28 +0000 Subject: [PATCH 0067/1081] Fix style --- src/Columns/ColumnVector.cpp | 2 +- src/DataTypes/Serializations/SerializationArray.cpp | 5 +++-- 2 files changed, 4 insertions(+), 3 deletions(-) diff --git a/src/Columns/ColumnVector.cpp b/src/Columns/ColumnVector.cpp index b4e3fee5e42..37e62c76596 100644 --- a/src/Columns/ColumnVector.cpp +++ b/src/Columns/ColumnVector.cpp @@ -469,7 +469,7 @@ void ColumnVector::insertRangeFrom(const IColumn & src, size_t start, size_t const ColumnVector & src_vec = assert_cast(src); if (start + length > src_vec.data.size()) - throw Exception(ErrorCodes::LOGICAL_ERROR, + throw Exception(ErrorCodes::PARAMETER_OUT_OF_BOUND, "Parameters start = {}, length = {} are out of bound " "in ColumnVector::insertRangeFrom method (data.size() = {}).", toString(start), toString(length), toString(src_vec.data.size())); diff --git a/src/DataTypes/Serializations/SerializationArray.cpp b/src/DataTypes/Serializations/SerializationArray.cpp index be23278ef25..bb22af16c69 100644 --- a/src/DataTypes/Serializations/SerializationArray.cpp +++ b/src/DataTypes/Serializations/SerializationArray.cpp @@ -348,6 +348,7 @@ void SerializationArray::deserializeBinaryBulkWithMultipleStreams( { auto mutable_column = column->assumeMutable(); ColumnArray & column_array = typeid_cast(*mutable_column); + size_t prev_last_offset = column_array.getOffsets().back(); settings.path.push_back(Substream::ArraySizes); if (auto cached_column = getFromSubstreamsCache(cache, settings.path)) @@ -371,9 +372,9 @@ void SerializationArray::deserializeBinaryBulkWithMultipleStreams( /// Number 
of values corresponding with `offset_values` must be read. size_t last_offset = offset_values.back(); - if (last_offset < nested_column->size()) + if (last_offset < prev_last_offset) throw Exception(ErrorCodes::LOGICAL_ERROR, "Nested column is longer than last offset"); - size_t nested_limit = last_offset - nested_column->size(); + size_t nested_limit = last_offset - prev_last_offset; if (unlikely(nested_limit > MAX_ARRAYS_SIZE)) throw Exception(ErrorCodes::TOO_LARGE_ARRAY_SIZE, "Array sizes are too large: {}", nested_limit); From 4e4aa90430d02f1fcc17b517946799f23c59b83e Mon Sep 17 00:00:00 2001 From: avogar Date: Sat, 23 Dec 2023 00:35:20 +0000 Subject: [PATCH 0068/1081] Remove debug logging --- src/DataTypes/Serializations/ISerialization.cpp | 5 ----- 1 file changed, 5 deletions(-) diff --git a/src/DataTypes/Serializations/ISerialization.cpp b/src/DataTypes/Serializations/ISerialization.cpp index 46353fffb48..08575f06f2a 100644 --- a/src/DataTypes/Serializations/ISerialization.cpp +++ b/src/DataTypes/Serializations/ISerialization.cpp @@ -124,20 +124,15 @@ void ISerialization::deserializeBinaryBulkWithMultipleStreams( DeserializeBinaryBulkStatePtr & /* state */, SubstreamsCache * cache) const { - LOG_DEBUG(&Poco::Logger::get("ISerialization"), "Deserialize path {}. Initial column size: {}", settings.path.toString(), column->size()); - auto cached_column = getFromSubstreamsCache(cache, settings.path); if (cached_column) { column = cached_column; - LOG_DEBUG(&Poco::Logger::get("ISerialization"), "Use column from cache. Size: {}", cached_column->size()); } else if (ReadBuffer * stream = settings.getter(settings.path)) { auto mutable_column = column->assumeMutable(); - LOG_DEBUG(&Poco::Logger::get("ISerialization"), "Deserialize column. Initial size: {}", mutable_column->size()); deserializeBinaryBulk(*mutable_column, *stream, limit, settings.avg_value_size_hint); - LOG_DEBUG(&Poco::Logger::get("ISerialization"), "Deserialized column. Size: {}", mutable_column->size()); column = std::move(mutable_column); addToSubstreamsCache(cache, settings.path, column); } From bc757559c9f3fd1943bf338dc4fdac9e0e61240a Mon Sep 17 00:00:00 2001 From: una Date: Sat, 23 Dec 2023 18:10:42 +0800 Subject: [PATCH 0069/1081] feat:add InitialQuery event --- src/Common/ProfileEvents.cpp | 1 + src/Databases/DatabaseReplicatedWorker.cpp | 7 +++++-- src/Interpreters/DDLWorker.cpp | 2 +- .../queries/0_stateless/02950_initialquery_event.reference | 1 + tests/queries/0_stateless/02950_initialquery_event.sql | 1 + 5 files changed, 9 insertions(+), 3 deletions(-) create mode 100644 tests/queries/0_stateless/02950_initialquery_event.reference create mode 100644 tests/queries/0_stateless/02950_initialquery_event.sql diff --git a/src/Common/ProfileEvents.cpp b/src/Common/ProfileEvents.cpp index f342a19b2aa..a2dc7f5ecd6 100644 --- a/src/Common/ProfileEvents.cpp +++ b/src/Common/ProfileEvents.cpp @@ -8,6 +8,7 @@ M(Query, "Number of queries to be interpreted and potentially executed. Does not include queries that failed to parse or were rejected due to AST size limits, quota limits or limits on the number of simultaneously running queries. May include internal queries initiated by ClickHouse itself. 
Does not count subqueries.") \ M(SelectQuery, "Same as Query, but only for SELECT queries.") \ M(InsertQuery, "Same as Query, but only for INSERT queries.") \ + M(InitialQuery, "Same as Query, but only counts initial queries (see is_initial_query).")\ M(QueriesWithSubqueries, "Count queries with all subqueries") \ M(SelectQueriesWithSubqueries, "Count SELECT queries with all subqueries") \ M(InsertQueriesWithSubqueries, "Count INSERT queries with all subqueries") \ diff --git a/src/Databases/DatabaseReplicatedWorker.cpp b/src/Databases/DatabaseReplicatedWorker.cpp index 2056b403ff6..c90af7d4ea8 100644 --- a/src/Databases/DatabaseReplicatedWorker.cpp +++ b/src/Databases/DatabaseReplicatedWorker.cpp @@ -6,7 +6,10 @@ #include namespace fs = std::filesystem; - +namespace ProfileEvents +{ + extern const Event InitialQuery; +} namespace DB { @@ -264,7 +267,7 @@ String DatabaseReplicatedDDLWorker::tryEnqueueAndExecuteEntry(DDLLogEntry & entr chassert(!task->entry.query.empty()); assert(!zookeeper->exists(task->getFinishedNodePath())); task->is_initial_query = true; - + ProfileEvents::increment(ProfileEvents::InitialQuery); LOG_DEBUG(log, "Waiting for worker thread to process all entries before {}", entry_name); UInt64 timeout = query_context->getSettingsRef().database_replicated_initial_query_timeout_sec; { diff --git a/src/Interpreters/DDLWorker.cpp b/src/Interpreters/DDLWorker.cpp index f08fd72ff7f..ac3af6e441c 100644 --- a/src/Interpreters/DDLWorker.cpp +++ b/src/Interpreters/DDLWorker.cpp @@ -490,7 +490,7 @@ bool DDLWorker::tryExecuteQuery(DDLTaskBase & task, const ZooKeeperPtr & zookeep if (!task.is_initial_query) query_scope.emplace(query_context); - + executeQuery(istr, ostr, !task.is_initial_query, query_context, {}, QueryFlags{ .internal = false, .distributed_backup_restore = task.entry.is_backup_restore }); if (auto txn = query_context->getZooKeeperMetadataTransaction()) diff --git a/tests/queries/0_stateless/02950_initialquery_event.reference b/tests/queries/0_stateless/02950_initialquery_event.reference new file mode 100644 index 00000000000..7ad67a1e7e4 --- /dev/null +++ b/tests/queries/0_stateless/02950_initialquery_event.reference @@ -0,0 +1 @@ +InitialQuery 6 Same as Query, but only counts initial queries (see is_initial_query). diff --git a/tests/queries/0_stateless/02950_initialquery_event.sql b/tests/queries/0_stateless/02950_initialquery_event.sql new file mode 100644 index 00000000000..2b03607c5c7 --- /dev/null +++ b/tests/queries/0_stateless/02950_initialquery_event.sql @@ -0,0 +1 @@ +SELECT * FROM system.events where event = 'InitialQuery' \ No newline at end of file From b38e7060ef455e6ae569d371203309a1ad992c66 Mon Sep 17 00:00:00 2001 From: una Date: Sat, 23 Dec 2023 18:36:23 +0800 Subject: [PATCH 0070/1081] feat:add InitialQuery event --- src/Common/ProfileEvents.cpp | 1 + src/Databases/DatabaseReplicatedWorker.cpp | 7 +++++-- src/Interpreters/DDLWorker.cpp | 2 +- .../queries/0_stateless/02950_initialquery_event.reference | 1 + tests/queries/0_stateless/02950_initialquery_event.sql | 1 + 5 files changed, 9 insertions(+), 3 deletions(-) create mode 100644 tests/queries/0_stateless/02950_initialquery_event.reference create mode 100644 tests/queries/0_stateless/02950_initialquery_event.sql diff --git a/src/Common/ProfileEvents.cpp b/src/Common/ProfileEvents.cpp index f342a19b2aa..a2dc7f5ecd6 100644 --- a/src/Common/ProfileEvents.cpp +++ b/src/Common/ProfileEvents.cpp @@ -8,6 +8,7 @@ M(Query, "Number of queries to be interpreted and potentially executed. 
Does not include queries that failed to parse or were rejected due to AST size limits, quota limits or limits on the number of simultaneously running queries. May include internal queries initiated by ClickHouse itself. Does not count subqueries.") \ M(SelectQuery, "Same as Query, but only for SELECT queries.") \ M(InsertQuery, "Same as Query, but only for INSERT queries.") \ + M(InitialQuery, "Same as Query, but only counts initial queries (see is_initial_query).")\ M(QueriesWithSubqueries, "Count queries with all subqueries") \ M(SelectQueriesWithSubqueries, "Count SELECT queries with all subqueries") \ M(InsertQueriesWithSubqueries, "Count INSERT queries with all subqueries") \ diff --git a/src/Databases/DatabaseReplicatedWorker.cpp b/src/Databases/DatabaseReplicatedWorker.cpp index 2056b403ff6..c90af7d4ea8 100644 --- a/src/Databases/DatabaseReplicatedWorker.cpp +++ b/src/Databases/DatabaseReplicatedWorker.cpp @@ -6,7 +6,10 @@ #include namespace fs = std::filesystem; - +namespace ProfileEvents +{ + extern const Event InitialQuery; +} namespace DB { @@ -264,7 +267,7 @@ String DatabaseReplicatedDDLWorker::tryEnqueueAndExecuteEntry(DDLLogEntry & entr chassert(!task->entry.query.empty()); assert(!zookeeper->exists(task->getFinishedNodePath())); task->is_initial_query = true; - + ProfileEvents::increment(ProfileEvents::InitialQuery); LOG_DEBUG(log, "Waiting for worker thread to process all entries before {}", entry_name); UInt64 timeout = query_context->getSettingsRef().database_replicated_initial_query_timeout_sec; { diff --git a/src/Interpreters/DDLWorker.cpp b/src/Interpreters/DDLWorker.cpp index f08fd72ff7f..ac3af6e441c 100644 --- a/src/Interpreters/DDLWorker.cpp +++ b/src/Interpreters/DDLWorker.cpp @@ -490,7 +490,7 @@ bool DDLWorker::tryExecuteQuery(DDLTaskBase & task, const ZooKeeperPtr & zookeep if (!task.is_initial_query) query_scope.emplace(query_context); - + executeQuery(istr, ostr, !task.is_initial_query, query_context, {}, QueryFlags{ .internal = false, .distributed_backup_restore = task.entry.is_backup_restore }); if (auto txn = query_context->getZooKeeperMetadataTransaction()) diff --git a/tests/queries/0_stateless/02950_initialquery_event.reference b/tests/queries/0_stateless/02950_initialquery_event.reference new file mode 100644 index 00000000000..7ad67a1e7e4 --- /dev/null +++ b/tests/queries/0_stateless/02950_initialquery_event.reference @@ -0,0 +1 @@ +InitialQuery 6 Same as Query, but only counts initial queries (see is_initial_query). 
diff --git a/tests/queries/0_stateless/02950_initialquery_event.sql b/tests/queries/0_stateless/02950_initialquery_event.sql new file mode 100644 index 00000000000..2b03607c5c7 --- /dev/null +++ b/tests/queries/0_stateless/02950_initialquery_event.sql @@ -0,0 +1 @@ +SELECT * FROM system.events where event = 'InitialQuery' \ No newline at end of file From 3e22f29b4529b6fefd5e92616ce9ef1ac33966d0 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Sat, 23 Dec 2023 11:40:58 +0100 Subject: [PATCH 0071/1081] Fixed parameters --- docs/en/operations/backup.md | 2 +- .../registerBackupEngineAzureBlobStorage.cpp | 25 +++++++++++++++---- .../test.py | 2 +- 3 files changed, 22 insertions(+), 7 deletions(-) diff --git a/docs/en/operations/backup.md b/docs/en/operations/backup.md index 15d953249a0..4871f97c270 100644 --- a/docs/en/operations/backup.md +++ b/docs/en/operations/backup.md @@ -463,7 +463,7 @@ To write backups to an AzureBlobStorage container you need the following pieces The destination for a backup will be specified like this: ``` -AzureBlobStorage('/', '', '', '', ') +AzureBlobStorage('/', '', '', '', '') ``` ```sql diff --git a/src/Backups/registerBackupEngineAzureBlobStorage.cpp b/src/Backups/registerBackupEngineAzureBlobStorage.cpp index 6f7b5f38c28..ef95206831f 100644 --- a/src/Backups/registerBackupEngineAzureBlobStorage.cpp +++ b/src/Backups/registerBackupEngineAzureBlobStorage.cpp @@ -22,6 +22,7 @@ namespace ErrorCodes { extern const int BAD_ARGUMENTS; extern const int SUPPORT_IS_DISABLED; + extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; } #if USE_AZURE_BLOB_STORAGE @@ -54,20 +55,34 @@ void registerBackupEngineAzureBlobStorage(BackupFactory & factory) StorageAzureBlob::Configuration configuration; - if (args.size() == 4) + if (args.size() == 3) { configuration.connection_url = args[0].safeGet(); configuration.is_connection_string = true; configuration.container = args[1].safeGet(); configuration.blob_path = args[2].safeGet(); - configuration.format = args[3].safeGet(); LOG_TRACE(&Poco::Logger::get("registerBackupEngineAzureBlobStorage"), "configuration.connection_url = {}" "configuration.container = {}" - "configuration.blob_path = {}" - "configuration.format = {}", - configuration.connection_url, configuration.container, configuration.blob_path, configuration.format); + "configuration.blob_path = {}", + configuration.connection_url, configuration.container, configuration.blob_path); + } + else if (args.size() == 5) + { + configuration.connection_url = args[0].safeGet(); + configuration.is_connection_string = false; + + configuration.container = args[1].safeGet(); + configuration.blob_path = args[2].safeGet(); + configuration.account_name = args[3].safeGet(); + configuration.account_key = args[4].safeGet(); + + } + else + { + throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + "Backup AzureBlobStorage requires 3 or 5 arguments: connection string>/ Date: Sat, 23 Dec 2023 18:42:41 +0800 Subject: [PATCH 0072/1081] feat:add InitialQuery event --- src/Interpreters/DDLWorker.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Interpreters/DDLWorker.cpp b/src/Interpreters/DDLWorker.cpp index ac3af6e441c..f08fd72ff7f 100644 --- a/src/Interpreters/DDLWorker.cpp +++ b/src/Interpreters/DDLWorker.cpp @@ -490,7 +490,7 @@ bool DDLWorker::tryExecuteQuery(DDLTaskBase & task, const ZooKeeperPtr & zookeep if (!task.is_initial_query) query_scope.emplace(query_context); - + executeQuery(istr, ostr, !task.is_initial_query, query_context, {}, QueryFlags{ .internal 
= false, .distributed_backup_restore = task.entry.is_backup_restore }); if (auto txn = query_context->getZooKeeperMetadataTransaction()) From f594ab34f50c1bcd860bd3b950c8d74ffe09662d Mon Sep 17 00:00:00 2001 From: avogar Date: Sat, 23 Dec 2023 12:56:11 +0000 Subject: [PATCH 0073/1081] Fix special build --- src/Columns/ColumnVariant.cpp | 8 +++--- src/Columns/ColumnVariant.h | 2 +- .../Serializations/SerializationArray.cpp | 5 ++-- .../Serializations/SerializationVariant.cpp | 26 +++++++------------ src/Functions/if.cpp | 2 +- 5 files changed, 17 insertions(+), 26 deletions(-) diff --git a/src/Columns/ColumnVariant.cpp b/src/Columns/ColumnVariant.cpp index a3a0362b646..f90ebfc54bb 100644 --- a/src/Columns/ColumnVariant.cpp +++ b/src/Columns/ColumnVariant.cpp @@ -102,7 +102,7 @@ ColumnVariant::ColumnVariant(MutableColumnPtr local_discriminators_, MutableColu { } -ColumnVariant::ColumnVariant(MutableColumnPtr local_discriminators_, MutableColumns && variants_, const std::vector & global_discriminators) : ColumnVariant(std::move(local_discriminators_), nullptr, std::move(variants_), global_discriminators) +ColumnVariant::ColumnVariant(MutableColumnPtr local_discriminators_, MutableColumns && variants_, const std::vector & local_to_global_discriminators_) : ColumnVariant(std::move(local_discriminators_), nullptr, std::move(variants_), local_to_global_discriminators_) { } @@ -449,12 +449,12 @@ void ColumnVariant::insertData(const char *, size_t) throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method insertData is not supported for {}", getName()); } -void ColumnVariant::insert(const Field & field) +void ColumnVariant::insert(const Field & x) { - if (field.isNull()) + if (x.isNull()) insertDefault(); else - throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Cannot insert field {} to column {}", toString(field), getName()); + throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Cannot insert field {} to column {}", toString(x), getName()); } void ColumnVariant::insertFrom(const IColumn & src_, size_t n) diff --git a/src/Columns/ColumnVariant.h b/src/Columns/ColumnVariant.h index ec58553f5f3..eb96205924c 100644 --- a/src/Columns/ColumnVariant.h +++ b/src/Columns/ColumnVariant.h @@ -194,7 +194,7 @@ public: template ColumnPtr indexImpl(const PaddedPODArray & indexes, size_t limit) const; ColumnPtr replicate(const Offsets & replicate_offsets) const override; - MutableColumns scatter(ColumnIndex num_variants, const Selector & selector) const override; + MutableColumns scatter(ColumnIndex num_columns, const Selector & selector) const override; void gather(ColumnGathererStream & gatherer_stream) override; /// Variant type is not comparable. diff --git a/src/DataTypes/Serializations/SerializationArray.cpp b/src/DataTypes/Serializations/SerializationArray.cpp index bb22af16c69..be23278ef25 100644 --- a/src/DataTypes/Serializations/SerializationArray.cpp +++ b/src/DataTypes/Serializations/SerializationArray.cpp @@ -348,7 +348,6 @@ void SerializationArray::deserializeBinaryBulkWithMultipleStreams( { auto mutable_column = column->assumeMutable(); ColumnArray & column_array = typeid_cast(*mutable_column); - size_t prev_last_offset = column_array.getOffsets().back(); settings.path.push_back(Substream::ArraySizes); if (auto cached_column = getFromSubstreamsCache(cache, settings.path)) @@ -372,9 +371,9 @@ void SerializationArray::deserializeBinaryBulkWithMultipleStreams( /// Number of values corresponding with `offset_values` must be read. 
size_t last_offset = offset_values.back(); - if (last_offset < prev_last_offset) + if (last_offset < nested_column->size()) throw Exception(ErrorCodes::LOGICAL_ERROR, "Nested column is longer than last offset"); - size_t nested_limit = last_offset - prev_last_offset; + size_t nested_limit = last_offset - nested_column->size(); if (unlikely(nested_limit > MAX_ARRAYS_SIZE)) throw Exception(ErrorCodes::TOO_LARGE_ARRAY_SIZE, "Array sizes are too large: {}", nested_limit); diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp index d36151fe8e9..c88dd8e9e0d 100644 --- a/src/DataTypes/Serializations/SerializationVariant.cpp +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -564,7 +564,7 @@ bool SerializationVariant::tryDeserializeImpl( IColumn & column, const String & field, std::function check_for_null, - std::function try_deserialize_variant) const + std::function try_deserialize_nested) const { auto & column_variant = assert_cast(column); ReadBufferFromString null_buf(field); @@ -577,25 +577,17 @@ bool SerializationVariant::tryDeserializeImpl( for (size_t global_discr : deserialize_text_order) { ReadBufferFromString variant_buf(field); - /// Usually try_deserialize_variant should not throw any exception, but let's use try/catch just in case. - try + auto & variant_column = column_variant.getVariantByGlobalDiscriminator(global_discr); + size_t prev_size = variant_column.size(); + if (try_deserialize_nested(variant_column, variants[global_discr], variant_buf) && variant_buf.eof()) { - auto & variant_column = column_variant.getVariantByGlobalDiscriminator(global_discr); - size_t prev_size = variant_column.size(); - if (try_deserialize_variant(variant_column, variants[global_discr], variant_buf) && variant_buf.eof()) - { - column_variant.getLocalDiscriminators().push_back(column_variant.localDiscriminatorByGlobal(global_discr)); - column_variant.getOffsets().push_back(prev_size); - return true; - } - else if (variant_column.size() > prev_size) - { - variant_column.popBack(1); - } + column_variant.getLocalDiscriminators().push_back(column_variant.localDiscriminatorByGlobal(global_discr)); + column_variant.getOffsets().push_back(prev_size); + return true; } - catch (...) + else if (variant_column.size() > prev_size) { - /// Try next variant. 
+ variant_column.popBack(1); } } diff --git a/src/Functions/if.cpp b/src/Functions/if.cpp index b15bc5938be..9ca4b487119 100644 --- a/src/Functions/if.cpp +++ b/src/Functions/if.cpp @@ -224,7 +224,7 @@ public: return std::make_shared(context->getSettingsRef().allow_experimental_variant_type && context->getSettingsRef().use_variant_when_no_common_type_in_if); } - FunctionIf(bool use_variant_when_no_common_type_ = false) : FunctionIfBase(), use_variant_when_no_common_type(use_variant_when_no_common_type_) {} + explicit FunctionIf(bool use_variant_when_no_common_type_ = false) : FunctionIfBase(), use_variant_when_no_common_type(use_variant_when_no_common_type_) {} private: bool use_variant_when_no_common_type = false; From fa5dde0bff8f34ebe85e1cc6e929f834c5e6b496 Mon Sep 17 00:00:00 2001 From: una Date: Wed, 27 Dec 2023 12:37:06 +0800 Subject: [PATCH 0074/1081] feat: Add initial query event --- src/Databases/DatabaseReplicatedWorker.cpp | 6 +-- src/Interpreters/InterpreterFactory.cpp | 5 +- ..._distributed_initial_query_event.reference | 6 +++ .../02950_distributed_initial_query_event.sh | 54 +++++++++++++++++++ .../02950_initialquery_event.reference | 1 - .../0_stateless/02950_initialquery_event.sql | 1 - 6 files changed, 66 insertions(+), 7 deletions(-) create mode 100644 tests/queries/0_stateless/02950_distributed_initial_query_event.reference create mode 100644 tests/queries/0_stateless/02950_distributed_initial_query_event.sh delete mode 100644 tests/queries/0_stateless/02950_initialquery_event.reference delete mode 100644 tests/queries/0_stateless/02950_initialquery_event.sql diff --git a/src/Databases/DatabaseReplicatedWorker.cpp b/src/Databases/DatabaseReplicatedWorker.cpp index c90af7d4ea8..317cda3cd3d 100644 --- a/src/Databases/DatabaseReplicatedWorker.cpp +++ b/src/Databases/DatabaseReplicatedWorker.cpp @@ -7,9 +7,7 @@ namespace fs = std::filesystem; namespace ProfileEvents -{ - extern const Event InitialQuery; -} + namespace DB { @@ -267,7 +265,7 @@ String DatabaseReplicatedDDLWorker::tryEnqueueAndExecuteEntry(DDLLogEntry & entr chassert(!task->entry.query.empty()); assert(!zookeeper->exists(task->getFinishedNodePath())); task->is_initial_query = true; - ProfileEvents::increment(ProfileEvents::InitialQuery); + LOG_DEBUG(log, "Waiting for worker thread to process all entries before {}", entry_name); UInt64 timeout = query_context->getSettingsRef().database_replicated_initial_query_timeout_sec; { diff --git a/src/Interpreters/InterpreterFactory.cpp b/src/Interpreters/InterpreterFactory.cpp index e32cbe4ccad..fdf7e8ebfbb 100644 --- a/src/Interpreters/InterpreterFactory.cpp +++ b/src/Interpreters/InterpreterFactory.cpp @@ -120,6 +120,7 @@ namespace ProfileEvents { extern const Event Query; + extern const Event InitialQuery; extern const Event QueriesWithSubqueries; extern const Event SelectQuery; extern const Event InsertQuery; @@ -137,7 +138,9 @@ namespace ErrorCodes std::unique_ptr InterpreterFactory::get(ASTPtr & query, ContextMutablePtr context, const SelectQueryOptions & options) { ProfileEvents::increment(ProfileEvents::Query); - + + if (context->getClientInfo().query_kind == ClientInfo::QueryKind::INITIAL_QUERY) + ProfileEvents::increment(ProfileEvents::InitialQuery); /// SELECT and INSERT query will handle QueriesWithSubqueries on their own. 
if (!(query->as() || query->as() || diff --git a/tests/queries/0_stateless/02950_distributed_initial_query_event.reference b/tests/queries/0_stateless/02950_distributed_initial_query_event.reference new file mode 100644 index 00000000000..af8542c7204 --- /dev/null +++ b/tests/queries/0_stateless/02950_distributed_initial_query_event.reference @@ -0,0 +1,6 @@ +Local situation +Initial Query Difference: 1 +Query Difference: 1 +Distributed situation +Initial Query Difference: 1 +Query Difference: 2 diff --git a/tests/queries/0_stateless/02950_distributed_initial_query_event.sh b/tests/queries/0_stateless/02950_distributed_initial_query_event.sh new file mode 100644 index 00000000000..3a01aa63d87 --- /dev/null +++ b/tests/queries/0_stateless/02950_distributed_initial_query_event.sh @@ -0,0 +1,54 @@ +-- Tags: distributed + +CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# shellcheck source=../shell_config.sh +. "$CUR_DIR"/../shell_config.sh +# CREATE TABLE local (x UInt8) Engine=Memory; +# CREATE TABLE distributed ON CLUSTER cluster (p Date, i Int32) ENGINE = Distributed(test_cluster_two_shards, currentDatabase(), x) +$CLICKHOUSE_CLIENT -n -q " +DROP TABLE IF EXISTS local; +DROP TABLE IF EXISTS distributed; +CREATE TABLE local (x UInt8) Engine=Memory; +CREATE TABLE distributed AS local ENGINE = Distributed(test_cluster_two_shards, currentDatabase(), local, x); +INSERT INTO distributed SELECT number FROM numbers(10); +SYSTEM FLUSH DISTRIBUTED distributed; +" +echo "Local situation" +# before SELECT * FROM local +query_countI=$($CLICKHOUSE_CLIENT -q "SELECT value FROM system.events WHERE event = 'InitialQuery'") +query_countQ=$($CLICKHOUSE_CLIENT -q "SELECT value FROM system.events WHERE event = 'Query'") + +# Execute SELECT * FROM local +$CLICKHOUSE_CLIENT -q "SELECT * FROM local" > /dev/null + +# Counts after SELECT * FROM local +After_query_countI=$($CLICKHOUSE_CLIENT -q "SELECT value FROM system.events WHERE event = 'InitialQuery'") +After_query_countQ=$($CLICKHOUSE_CLIENT -q "SELECT value FROM system.events WHERE event = 'Query'") + +# Calculate the differences +Initial_query_diff=$(($After_query_countI-$query_countI-2)) +query_diff=$(($After_query_countQ-$query_countQ-2)) + +echo "Initial Query Difference: $Initial_query_diff" +echo "Query Difference: $query_diff" +echo "Distributed situation" + +# before SELECT * FROM distributed +query_countI=$($CLICKHOUSE_CLIENT -q "SELECT value FROM system.events WHERE event = 'InitialQuery'") +query_countQ=$($CLICKHOUSE_CLIENT -q "SELECT value FROM system.events WHERE event = 'Query'") + +# Execute SELECT * FROM distributed +$CLICKHOUSE_CLIENT -q "SELECT * FROM distributed" > /dev/null + +# Counts after SELECT * FROM distributed +After_query_countI=$($CLICKHOUSE_CLIENT -q "SELECT value FROM system.events WHERE event = 'InitialQuery'") +After_query_countQ=$($CLICKHOUSE_CLIENT -q "SELECT value FROM system.events WHERE event = 'Query'") + +# Calculate the differences +Initial_query_diff=$(($After_query_countI-$query_countI-2)) +query_diff=$(($After_query_countQ-$query_countQ-2)) + +echo "Initial Query Difference: $Initial_query_diff" +echo "Query Difference: $query_diff" + + diff --git a/tests/queries/0_stateless/02950_initialquery_event.reference b/tests/queries/0_stateless/02950_initialquery_event.reference deleted file mode 100644 index 7ad67a1e7e4..00000000000 --- a/tests/queries/0_stateless/02950_initialquery_event.reference +++ /dev/null @@ -1 +0,0 @@ -InitialQuery 6 Same as Query, but only counts initial queries (see is_initial_query). 
diff --git a/tests/queries/0_stateless/02950_initialquery_event.sql b/tests/queries/0_stateless/02950_initialquery_event.sql deleted file mode 100644 index 2b03607c5c7..00000000000 --- a/tests/queries/0_stateless/02950_initialquery_event.sql +++ /dev/null @@ -1 +0,0 @@ -SELECT * FROM system.events where event = 'InitialQuery' \ No newline at end of file From 1464c3d1aab8c6ecdc369facceb1b9f6cf4b36fb Mon Sep 17 00:00:00 2001 From: una Date: Wed, 27 Dec 2023 15:13:21 +0800 Subject: [PATCH 0075/1081] feat: Add initial query event --- src/Databases/DatabaseReplicatedWorker.cpp | 3 +-- .../02950_distributed_initial_query_event.reference | 2 +- .../0_stateless/02950_distributed_initial_query_event.sh | 7 +++---- 3 files changed, 5 insertions(+), 7 deletions(-) diff --git a/src/Databases/DatabaseReplicatedWorker.cpp b/src/Databases/DatabaseReplicatedWorker.cpp index 317cda3cd3d..2056b403ff6 100644 --- a/src/Databases/DatabaseReplicatedWorker.cpp +++ b/src/Databases/DatabaseReplicatedWorker.cpp @@ -6,7 +6,6 @@ #include namespace fs = std::filesystem; -namespace ProfileEvents namespace DB { @@ -265,7 +264,7 @@ String DatabaseReplicatedDDLWorker::tryEnqueueAndExecuteEntry(DDLLogEntry & entr chassert(!task->entry.query.empty()); assert(!zookeeper->exists(task->getFinishedNodePath())); task->is_initial_query = true; - + LOG_DEBUG(log, "Waiting for worker thread to process all entries before {}", entry_name); UInt64 timeout = query_context->getSettingsRef().database_replicated_initial_query_timeout_sec; { diff --git a/tests/queries/0_stateless/02950_distributed_initial_query_event.reference b/tests/queries/0_stateless/02950_distributed_initial_query_event.reference index af8542c7204..cf10427e9b3 100644 --- a/tests/queries/0_stateless/02950_distributed_initial_query_event.reference +++ b/tests/queries/0_stateless/02950_distributed_initial_query_event.reference @@ -3,4 +3,4 @@ Initial Query Difference: 1 Query Difference: 1 Distributed situation Initial Query Difference: 1 -Query Difference: 2 +Query Difference: 3 diff --git a/tests/queries/0_stateless/02950_distributed_initial_query_event.sh b/tests/queries/0_stateless/02950_distributed_initial_query_event.sh index 3a01aa63d87..c8a955c4fe5 100644 --- a/tests/queries/0_stateless/02950_distributed_initial_query_event.sh +++ b/tests/queries/0_stateless/02950_distributed_initial_query_event.sh @@ -1,4 +1,5 @@ --- Tags: distributed +#!/usr/bin/env bash +# Tags:no-parallel shard CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # shellcheck source=../shell_config.sh @@ -38,7 +39,7 @@ query_countI=$($CLICKHOUSE_CLIENT -q "SELECT value FROM system.events WHERE even query_countQ=$($CLICKHOUSE_CLIENT -q "SELECT value FROM system.events WHERE event = 'Query'") # Execute SELECT * FROM distributed -$CLICKHOUSE_CLIENT -q "SELECT * FROM distributed" > /dev/null +$CLICKHOUSE_CLIENT -q "SELECT * FROM distributed SETTINGS prefer_localhost_replica = 0" > /dev/null # Counts after SELECT * FROM distributed After_query_countI=$($CLICKHOUSE_CLIENT -q "SELECT value FROM system.events WHERE event = 'InitialQuery'") @@ -50,5 +51,3 @@ query_diff=$(($After_query_countQ-$query_countQ-2)) echo "Initial Query Difference: $Initial_query_diff" echo "Query Difference: $query_diff" - - From 22e1bcb9d638d5df0c43585b1d78228beedb0dc8 Mon Sep 17 00:00:00 2001 From: una Date: Wed, 27 Dec 2023 16:12:10 +0800 Subject: [PATCH 0076/1081] feat:add InitialQuery event Signed-off-by: una --- .../0_stateless/02950_distributed_initial_query_event.sh | 2 +- 1 file changed, 1 insertion(+), 1 
deletion(-) diff --git a/tests/queries/0_stateless/02950_distributed_initial_query_event.sh b/tests/queries/0_stateless/02950_distributed_initial_query_event.sh index c8a955c4fe5..ddd0fb1e408 100644 --- a/tests/queries/0_stateless/02950_distributed_initial_query_event.sh +++ b/tests/queries/0_stateless/02950_distributed_initial_query_event.sh @@ -1,5 +1,5 @@ #!/usr/bin/env bash -# Tags:no-parallel shard +# Tags:no-parallel, shard CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # shellcheck source=../shell_config.sh From a6f2eaf5a6ba2a26943d0c1c53c7cf7460a7471d Mon Sep 17 00:00:00 2001 From: una Date: Wed, 27 Dec 2023 16:19:06 +0800 Subject: [PATCH 0077/1081] fix:use , to split tags Signed-off-by: una --- .../0_stateless/02950_distributed_initial_query_event.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02950_distributed_initial_query_event.sh b/tests/queries/0_stateless/02950_distributed_initial_query_event.sh index ddd0fb1e408..7f690a681c4 100644 --- a/tests/queries/0_stateless/02950_distributed_initial_query_event.sh +++ b/tests/queries/0_stateless/02950_distributed_initial_query_event.sh @@ -1,5 +1,5 @@ #!/usr/bin/env bash -# Tags:no-parallel, shard +# Tags:no-parallel,shard CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # shellcheck source=../shell_config.sh From d46d91452176414426e40f598a7a1aa989f1a584 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Wed, 27 Dec 2023 10:28:52 +0100 Subject: [PATCH 0078/1081] Updated thread name --- src/Backups/BackupIO_AzureBlobStorage.cpp | 8 +- src/Backups/BackupIO_AzureBlobStorage.h | 81 +++++++++---------- .../copyAzureBlobStorageFile.cpp | 25 +++--- 3 files changed, 59 insertions(+), 55 deletions(-) diff --git a/src/Backups/BackupIO_AzureBlobStorage.cpp b/src/Backups/BackupIO_AzureBlobStorage.cpp index d41d23e3c36..a1fd5bd8327 100644 --- a/src/Backups/BackupIO_AzureBlobStorage.cpp +++ b/src/Backups/BackupIO_AzureBlobStorage.cpp @@ -35,7 +35,7 @@ BackupReaderAzureBlobStorage::BackupReaderAzureBlobStorage( const WriteSettings & write_settings_, const ContextPtr & context_) : BackupReaderDefault(read_settings_, write_settings_, &Poco::Logger::get("BackupReaderAzureBlobStorage")) - , data_source_description{DataSourceType::AzureBlobStorage, "AzureBlobStorage", false, false} + , data_source_description{DataSourceType::AzureBlobStorage, configuration_.container, false, false} , configuration(configuration_) { client = StorageAzureBlob::createClient(configuration, /* is_read_only */ false); @@ -160,7 +160,7 @@ BackupWriterAzureBlobStorage::BackupWriterAzureBlobStorage( const WriteSettings & write_settings_, const ContextPtr & context_) : BackupWriterDefault(read_settings_, write_settings_, &Poco::Logger::get("BackupWriterAzureBlobStorage")) - , data_source_description{DataSourceType::AzureBlobStorage, "AzureBlobStorage", false, false} + , data_source_description{DataSourceType::AzureBlobStorage,configuration_.container, false, false} , configuration(configuration_) { client = StorageAzureBlob::createClient(configuration, /* is_read_only */ false); @@ -209,7 +209,7 @@ void BackupWriterAzureBlobStorage::copyFileFromDisk(const String & path_in_backu settings, read_settings, {}, - threadPoolCallbackRunner(getBackupsIOThreadPool().get(), "BackupWriterAzureBlobStorage")); + threadPoolCallbackRunner(getBackupsIOThreadPool().get(), "BackupWriterS3")); return; /// copied! 
} } @@ -221,7 +221,7 @@ void BackupWriterAzureBlobStorage::copyFileFromDisk(const String & path_in_backu void BackupWriterAzureBlobStorage::copyDataToFile(const String & path_in_backup, const CreateReadBufferFunction & create_read_buffer, UInt64 start_pos, UInt64 length) { copyDataToAzureBlobStorageFile(create_read_buffer, start_pos, length, client, configuration.container, path_in_backup, settings, {}, - threadPoolCallbackRunner(getBackupsIOThreadPool().get(), "BackupWriterAzureBlobStorage")); + threadPoolCallbackRunner(getBackupsIOThreadPool().get(), "BackupWriterS3")); } BackupWriterAzureBlobStorage::~BackupWriterAzureBlobStorage() = default; diff --git a/src/Backups/BackupIO_AzureBlobStorage.h b/src/Backups/BackupIO_AzureBlobStorage.h index 6ef66fc432d..65affb9f079 100644 --- a/src/Backups/BackupIO_AzureBlobStorage.h +++ b/src/Backups/BackupIO_AzureBlobStorage.h @@ -12,57 +12,54 @@ namespace DB { -// using AzureClientPtr = std::shared_ptr; - /// Represents a backup stored to Azure - class BackupReaderAzureBlobStorage : public BackupReaderDefault - { - public: - BackupReaderAzureBlobStorage(StorageAzureBlob::Configuration configuration_, const ReadSettings & read_settings_, const WriteSettings & write_settings_, const ContextPtr & context_); - ~BackupReaderAzureBlobStorage() override; +class BackupReaderAzureBlobStorage : public BackupReaderDefault +{ +public: + BackupReaderAzureBlobStorage(StorageAzureBlob::Configuration configuration_, const ReadSettings & read_settings_, const WriteSettings & write_settings_, const ContextPtr & context_); + ~BackupReaderAzureBlobStorage() override; - bool fileExists(const String & file_name) override; - UInt64 getFileSize(const String & file_name) override; - std::unique_ptr readFile(const String & file_name) override; + bool fileExists(const String & file_name) override; + UInt64 getFileSize(const String & file_name) override; + std::unique_ptr readFile(const String & file_name) override; - void copyFileToDisk(const String & path_in_backup, size_t file_size, bool encrypted_in_backup, - DiskPtr destination_disk, const String & destination_path, WriteMode write_mode) override; + void copyFileToDisk(const String & path_in_backup, size_t file_size, bool encrypted_in_backup, + DiskPtr destination_disk, const String & destination_path, WriteMode write_mode) override; - private: - const DataSourceDescription data_source_description; - std::shared_ptr client; - StorageAzureBlob::Configuration configuration; - std::unique_ptr object_storage; - std::shared_ptr settings; - }; +private: + const DataSourceDescription data_source_description; + std::shared_ptr client; + StorageAzureBlob::Configuration configuration; + std::unique_ptr object_storage; + std::shared_ptr settings; +}; +class BackupWriterAzureBlobStorage : public BackupWriterDefault +{ +public: + BackupWriterAzureBlobStorage(StorageAzureBlob::Configuration configuration_, const ReadSettings & read_settings_, const WriteSettings & write_settings_, const ContextPtr & context_); + ~BackupWriterAzureBlobStorage() override; - class BackupWriterAzureBlobStorage : public BackupWriterDefault - { - public: - BackupWriterAzureBlobStorage(StorageAzureBlob::Configuration configuration_, const ReadSettings & read_settings_, const WriteSettings & write_settings_, const ContextPtr & context_); - ~BackupWriterAzureBlobStorage() override; + bool fileExists(const String & file_name) override; + UInt64 getFileSize(const String & file_name) override; + std::unique_ptr writeFile(const String & file_name) override; - bool 
fileExists(const String & file_name) override; - UInt64 getFileSize(const String & file_name) override; - std::unique_ptr writeFile(const String & file_name) override; + void copyDataToFile(const String & path_in_backup, const CreateReadBufferFunction & create_read_buffer, UInt64 start_pos, UInt64 length) override; + void copyFileFromDisk(const String & path_in_backup, DiskPtr src_disk, const String & src_path, + bool copy_encrypted, UInt64 start_pos, UInt64 length) override; - void copyDataToFile(const String & path_in_backup, const CreateReadBufferFunction & create_read_buffer, UInt64 start_pos, UInt64 length) override; - void copyFileFromDisk(const String & path_in_backup, DiskPtr src_disk, const String & src_path, - bool copy_encrypted, UInt64 start_pos, UInt64 length) override; + void removeFile(const String & file_name) override; + void removeFiles(const Strings & file_names) override; - void removeFile(const String & file_name) override; - void removeFiles(const Strings & file_names) override; - - private: - std::unique_ptr readFile(const String & file_name, size_t expected_file_size) override; - void removeFilesBatch(const Strings & file_names); - const DataSourceDescription data_source_description; - std::shared_ptr client; - StorageAzureBlob::Configuration configuration; - std::unique_ptr object_storage; - std::shared_ptr settings; - }; +private: + std::unique_ptr readFile(const String & file_name, size_t expected_file_size) override; + void removeFilesBatch(const Strings & file_names); + const DataSourceDescription data_source_description; + std::shared_ptr client; + StorageAzureBlob::Configuration configuration; + std::unique_ptr object_storage; + std::shared_ptr settings; +}; } diff --git a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp index bf0bcac664b..0a0a080b5cb 100644 --- a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp +++ b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp @@ -22,6 +22,11 @@ namespace ProfileEvents extern const Event DiskAzureUploadPart; } +namespace ErrorCodes +{ + extern const int LOGICAL_ERROR; +} + namespace DB { @@ -44,7 +49,8 @@ namespace std::shared_ptr settings_, const std::optional> & object_metadata_, ThreadPoolCallbackRunner schedule_, - bool for_disk_azure_blob_storage_) + bool for_disk_azure_blob_storage_, + const Poco::Logger * log_) : create_read_buffer(create_read_buffer_) , client(client_) , offset (offset_) @@ -55,7 +61,7 @@ namespace , object_metadata(object_metadata_) , schedule(schedule_) , for_disk_azure_blob_storage(for_disk_azure_blob_storage_) - , log(&Poco::Logger::get("azureBlobStorageUploadHelper")) + , log(log_) , max_single_part_upload_size(settings_.get()->max_single_part_upload_size) { } @@ -179,11 +185,11 @@ namespace try { auto read_buffer = std::make_unique(create_read_buffer(), part_offset, part_size); - auto buffer = std::make_unique(std::move(read_buffer), part_size); task->data = new char[part_size]; task->size = part_size; - buffer->read(task->data,part_size); - task->block_id = getRandomASCIIString(64); + size_t n = read_buffer->read(task->data,part_size); + if (n != part_size) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Unexpected size"); schedule([this, task, task_finish_notify]() { @@ -208,9 +214,10 @@ namespace { UploadPartTask task; auto read_buffer = std::make_unique(create_read_buffer(), part_offset, part_size); - auto buffer = std::make_unique(std::move(read_buffer), part_size); task.data = new char[part_size]; - 
buffer->read(task.data,part_size); + size_t n = read_buffer->read(task.data,part_size); + if (n != part_size) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Unexpected size"); task.size = part_size; processUploadTask(task); block_ids.emplace_back(task.block_id); @@ -274,7 +281,7 @@ void copyDataToAzureBlobStorageFile( ThreadPoolCallbackRunner schedule, bool for_disk_azure_blob_storage) { - UploadHelper helper{create_read_buffer, dest_client, offset, size, dest_bucket, dest_key, settings, object_metadata, schedule, for_disk_azure_blob_storage}; + UploadHelper helper{create_read_buffer, dest_client, offset, size, dest_bucket, dest_key, settings, object_metadata, schedule, for_disk_azure_blob_storage, &Poco::Logger::get("copyDataToAzureBlobStorageFile")}; helper.performCopy(); } @@ -314,7 +321,7 @@ void copyAzureBlobStorageFile( settings->max_single_download_retries); }; - UploadHelper helper{create_read_buffer, dest_client, offset, size, dest_bucket, dest_key, settings, object_metadata, schedule, for_disk_azure_blob_storage}; + UploadHelper helper{create_read_buffer, dest_client, offset, size, dest_bucket, dest_key, settings, object_metadata, schedule, for_disk_azure_blob_storage, &Poco::Logger::get("copyAzureBlobStorageFile")}; helper.performCopy(); } } From 0181bab23c38c2d1c15f199d522a4743b11586d6 Mon Sep 17 00:00:00 2001 From: una Date: Wed, 27 Dec 2023 19:59:23 +0800 Subject: [PATCH 0079/1081] fix:style Signed-off-by: una --- src/Interpreters/InterpreterFactory.cpp | 1 - 1 file changed, 1 deletion(-) diff --git a/src/Interpreters/InterpreterFactory.cpp b/src/Interpreters/InterpreterFactory.cpp index fdf7e8ebfbb..c5d7f0f891c 100644 --- a/src/Interpreters/InterpreterFactory.cpp +++ b/src/Interpreters/InterpreterFactory.cpp @@ -138,7 +138,6 @@ namespace ErrorCodes std::unique_ptr InterpreterFactory::get(ASTPtr & query, ContextMutablePtr context, const SelectQueryOptions & options) { ProfileEvents::increment(ProfileEvents::Query); - if (context->getClientInfo().query_kind == ClientInfo::QueryKind::INITIAL_QUERY) ProfileEvents::increment(ProfileEvents::InitialQuery); /// SELECT and INSERT query will handle QueriesWithSubqueries on their own. 
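For reference, the behaviour the InitialQuery patches above assert reduces to one counting rule: every executed query increments the `Query` event, while only a query arriving directly from a client (`ClientInfo::QueryKind::INITIAL_QUERY`) increments `InitialQuery`. The sketch below is a minimal standalone model of that rule, not ClickHouse code; it assumes, as in the test, a two-shard distributed table with `prefer_localhost_replica = 0` whose secondary shard queries land on the same single-node server, which is what yields the expected differences of 1/1 for the local table and 1/3 for the distributed one.

```cpp
// Standalone sketch (not ClickHouse code) of the InitialQuery / Query counting rule.
#include <cstdint>
#include <iostream>

enum class QueryKind { Initial, Secondary };

struct Events
{
    uint64_t query = 0;
    uint64_t initial_query = 0;

    void onQueryStart(QueryKind kind)
    {
        ++query;                       // every query is counted
        if (kind == QueryKind::Initial)
            ++initial_query;           // only client-issued (initial) queries are counted here
    }
};

int main()
{
    Events events;

    // "Local situation": SELECT * FROM local -- one initial query, nothing fanned out.
    Events before = events;
    events.onQueryStart(QueryKind::Initial);
    std::cout << "Local: InitialQuery diff = " << events.initial_query - before.initial_query
              << ", Query diff = " << events.query - before.query << '\n';   // 1 and 1

    // "Distributed situation": one initial query plus one secondary query per shard,
    // all served by the same node in the single-server test setup.
    before = events;
    events.onQueryStart(QueryKind::Initial);
    events.onQueryStart(QueryKind::Secondary);   // shard 1
    events.onQueryStart(QueryKind::Secondary);   // shard 2
    std::cout << "Distributed: InitialQuery diff = " << events.initial_query - before.initial_query
              << ", Query diff = " << events.query - before.query << '\n';   // 1 and 3
}
```

The shell test additionally subtracts 2 from each raw difference, which can be read as discounting the two bookkeeping SELECTs on `system.events` that themselves run between the before/after snapshots.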
From 2c1513540768eaed34a13fd643c4ace491421c0e Mon Sep 17 00:00:00 2001 From: una Date: Wed, 27 Dec 2023 20:53:30 +0800 Subject: [PATCH 0080/1081] fix test-file permissions Signed-off-by: una --- .../queries/0_stateless/02950_distributed_initial_query_event.sh | 0 1 file changed, 0 insertions(+), 0 deletions(-) mode change 100644 => 100755 tests/queries/0_stateless/02950_distributed_initial_query_event.sh diff --git a/tests/queries/0_stateless/02950_distributed_initial_query_event.sh b/tests/queries/0_stateless/02950_distributed_initial_query_event.sh old mode 100644 new mode 100755 From 5497fa79edfa6fdc2559d516486f80f88af40c68 Mon Sep 17 00:00:00 2001 From: avogar Date: Wed, 27 Dec 2023 14:11:53 +0000 Subject: [PATCH 0081/1081] Fix tests --- src/DataTypes/Serializations/SerializationEnum.cpp | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/src/DataTypes/Serializations/SerializationEnum.cpp b/src/DataTypes/Serializations/SerializationEnum.cpp index fb384547d64..14b1a33e2ce 100644 --- a/src/DataTypes/Serializations/SerializationEnum.cpp +++ b/src/DataTypes/Serializations/SerializationEnum.cpp @@ -73,7 +73,9 @@ template bool SerializationEnum::tryDeserializeTextQuoted(IColumn & column, ReadBuffer & istr, const FormatSettings &) const { std::string field_name; - readQuotedStringWithSQLStyle(field_name, istr); + if (!tryReadQuotedStringWithSQLStyle(field_name, istr)) + return false; + FieldType x; if (!ref_enum_values.tryGetValue(x, StringRef(field_name))) return false; From 4b2a0b99fc094e6b70e516af0360f126f62a886d Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Wed, 27 Dec 2023 20:02:50 +0100 Subject: [PATCH 0082/1081] Update docs/en/sql-reference/functions/other-functions.md --- docs/en/sql-reference/functions/other-functions.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/en/sql-reference/functions/other-functions.md b/docs/en/sql-reference/functions/other-functions.md index d69d692d055..ebc80e4d308 100644 --- a/docs/en/sql-reference/functions/other-functions.md +++ b/docs/en/sql-reference/functions/other-functions.md @@ -2839,7 +2839,7 @@ Extracts a column with specified type from a `Variant` column. **Syntax** ```sql -tupleElement(variant, type_name, [, default_value]) +variantElement(variant, type_name, [, default_value]) ``` **Arguments** From 275fbe3e986c8faee3bd396e3ed87e3707f0f25f Mon Sep 17 00:00:00 2001 From: avogar Date: Wed, 27 Dec 2023 20:04:14 +0000 Subject: [PATCH 0083/1081] Support function to subcolumns optimization for Variant, better text priority for reading Bool --- .../Passes/FunctionToSubcolumnsPass.cpp | 17 +++++++++++++++++ .../Serializations/SerializationVariant.cpp | 4 ++++ .../RewriteFunctionToSubcolumnVisitor.cpp | 15 +++++++++++++++ 3 files changed, 36 insertions(+) diff --git a/src/Analyzer/Passes/FunctionToSubcolumnsPass.cpp b/src/Analyzer/Passes/FunctionToSubcolumnsPass.cpp index cd635f87e0e..c74c1038173 100644 --- a/src/Analyzer/Passes/FunctionToSubcolumnsPass.cpp +++ b/src/Analyzer/Passes/FunctionToSubcolumnsPass.cpp @@ -176,6 +176,23 @@ public: node = std::make_shared(column, column_source); } + else if (function_name == "variantElement" && isVariant(column_type) && second_argument_constant_node) + { + /// Replace `variantElement(variant_argument, type_name)` with `variant_argument.type_name`. 
+ const auto & variant_element_constant_value = second_argument_constant_node->getValue(); + String subcolumn_name; + + if (variant_element_constant_value.getType() != Field::Types::String) + return; + + subcolumn_name = variant_element_constant_value.get(); + + column.name += '.'; + column.name += subcolumn_name; + column.type = function_node->getResultType(); + + node = std::make_shared(column, column_source); + } else if (function_name == "mapContains" && column_type.isMap()) { const auto & data_type_map = assert_cast(*column.type); diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp index c88dd8e9e0d..49ecb2fc546 100644 --- a/src/DataTypes/Serializations/SerializationVariant.cpp +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -534,6 +534,10 @@ std::tuple getTypeTextDeserializePriority(const DataType return {max_depth, max_priority, max_simple_nested_depth}; } + /// Bool type should have priority higher then all integers. + if (isBool(type)) + return {nested_depth, priority_map[TypeIndex::Int8] + 1 , simple_nested_depth}; + return {nested_depth, priority_map[type->getTypeId()], simple_nested_depth}; } diff --git a/src/Interpreters/RewriteFunctionToSubcolumnVisitor.cpp b/src/Interpreters/RewriteFunctionToSubcolumnVisitor.cpp index 506fa13b7ba..0717abd4782 100644 --- a/src/Interpreters/RewriteFunctionToSubcolumnVisitor.cpp +++ b/src/Interpreters/RewriteFunctionToSubcolumnVisitor.cpp @@ -122,6 +122,21 @@ void RewriteFunctionToSubcolumnData::visit(ASTFunction & function, ASTPtr & ast) ast = transformToSubcolumn(name_in_storage, subcolumn_name); ast->setAlias(alias); } + else if (function.name == "variantElement" && column_type_id == TypeIndex::Variant) + { + const auto * literal = arguments[1]->as(); + if (!literal) + return; + + String subcolumn_name; + auto value_type = literal->value.getType(); + if (value_type != Field::Types::String) + return; + + subcolumn_name = literal->value.get(); + ast = transformToSubcolumn(name_in_storage, subcolumn_name); + ast->setAlias(alias); + } else { auto it = binary_function_to_subcolumn.find(function.name); From 8b4157141c0501d4498278947b468d03638cdf8a Mon Sep 17 00:00:00 2001 From: avogar Date: Wed, 27 Dec 2023 20:36:10 +0000 Subject: [PATCH 0084/1081] Fix style --- src/DataTypes/Serializations/SerializationVariant.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp index 49ecb2fc546..9cfc4b9e26f 100644 --- a/src/DataTypes/Serializations/SerializationVariant.cpp +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -536,7 +536,7 @@ std::tuple getTypeTextDeserializePriority(const DataType /// Bool type should have priority higher then all integers. 
if (isBool(type)) - return {nested_depth, priority_map[TypeIndex::Int8] + 1 , simple_nested_depth}; + return {nested_depth, priority_map[TypeIndex::Int8] + 1, simple_nested_depth}; return {nested_depth, priority_map[type->getTypeId()], simple_nested_depth}; } From 32ff152f2d7e4798a7bbc916808cc9ca883cf13e Mon Sep 17 00:00:00 2001 From: flynn Date: Thu, 28 Dec 2023 11:41:06 +0000 Subject: [PATCH 0085/1081] Support negtive position arguments --- .../replaceForPositionalArguments.cpp | 24 ++++- .../0_stateless/01798_having_push_down.sql | 3 +- .../02006_test_positional_arguments.reference | 94 +++++++++++++++++++ .../02006_test_positional_arguments.sql | 21 +++++ .../02932_group_by_null_fuzzer.sql | 1 + 5 files changed, 137 insertions(+), 6 deletions(-) diff --git a/src/Interpreters/replaceForPositionalArguments.cpp b/src/Interpreters/replaceForPositionalArguments.cpp index 241dd7cf92c..bea87ad913a 100644 --- a/src/Interpreters/replaceForPositionalArguments.cpp +++ b/src/Interpreters/replaceForPositionalArguments.cpp @@ -27,14 +27,28 @@ bool replaceForPositionalArguments(ASTPtr & argument, const ASTSelectQuery * sel return false; auto which = ast_literal->value.getType(); - if (which != Field::Types::UInt64) + if (which != Field::Types::UInt64 && which != Field::Types::Int64) return false; - auto pos = ast_literal->value.get(); + UInt64 pos; + + if (which == Field::Types::UInt64) + { + pos = ast_literal->value.get(); + } + else if (which == Field::Types::Int64) + { + auto value = ast_literal->value.get(); + pos = value > 0 ? value : columns.size() + value + 1; + } + else + { + return false; + } + if (!pos || pos > columns.size()) - throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, - "Positional argument out of bounds: {} (expected in range [1, {}]", - pos, columns.size()); + throw Exception( + ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Positional argument out of bounds: {} (expected in range [1, {}]", pos, columns.size()); const auto & column = columns[--pos]; if (typeid_cast(column.get()) || typeid_cast(column.get())) diff --git a/tests/queries/0_stateless/01798_having_push_down.sql b/tests/queries/0_stateless/01798_having_push_down.sql index b3a77c8f5b5..c0c3447f5ab 100644 --- a/tests/queries/0_stateless/01798_having_push_down.sql +++ b/tests/queries/0_stateless/01798_having_push_down.sql @@ -8,11 +8,12 @@ SELECT sum(c0 = 0), min(c0 + 1), sum(c0 + 2) FROM t_having GROUP BY c0 HAVING c0 = 0 SETTINGS enable_optimize_predicate_expression=0; +SET enable_positional_arguments=0; + SELECT c0 + -1, sum(intDivOrZero(intDivOrZero(NULL, NULL), '2'), intDivOrZero(10000000000., intDivOrZero(intDivOrZero(intDivOrZero(NULL, NULL), 10), NULL))) FROM t_having GROUP BY c0 = 2, c0 = 10, intDivOrZero(intDivOrZero(intDivOrZero(NULL, NULL), NULL), NULL), c0 HAVING c0 = 2 SETTINGS enable_optimize_predicate_expression = 0; SELECT sum(c0 + 257) FROM t_having GROUP BY c0 = -9223372036854775808, NULL, -2147483649, c0 HAVING c0 = -9223372036854775808 SETTINGS enable_optimize_predicate_expression = 0; -SET enable_positional_arguments=0; SELECT c0 + -2, c0 + -9223372036854775807, c0 = NULL FROM t_having GROUP BY c0 = 0.9998999834060669, 1023, c0 HAVING c0 = 0.9998999834060669 SETTINGS enable_optimize_predicate_expression = 0; DROP TABLE t_having; diff --git a/tests/queries/0_stateless/02006_test_positional_arguments.reference b/tests/queries/0_stateless/02006_test_positional_arguments.reference index 40100e8d5be..079bd071103 100644 --- a/tests/queries/0_stateless/02006_test_positional_arguments.reference +++ 
b/tests/queries/0_stateless/02006_test_positional_arguments.reference @@ -3,18 +3,50 @@ select x3, x2, x1 from test order by 1; 1 100 100 10 1 10 100 10 1 +select x3, x2, x1 from test order by -3; +1 100 100 +10 1 10 +100 10 1 select x3, x2, x1 from test order by x3; 1 100 100 10 1 10 100 10 1 +select x3, x2, x1 from test order by 3; +100 10 1 +10 1 10 +1 100 100 +select x3, x2, x1 from test order by -1; +100 10 1 +10 1 10 +1 100 100 +select x3, x2, x1 from test order by x1; +100 10 1 +10 1 10 +1 100 100 select x3, x2, x1 from test order by 1 desc; 100 10 1 10 1 10 1 100 100 +select x3, x2, x1 from test order by -3 desc; +100 10 1 +10 1 10 +1 100 100 select x3, x2, x1 from test order by x3 desc; 100 10 1 10 1 10 1 100 100 +select x3, x2, x1 from test order by 3 desc; +1 100 100 +10 1 10 +100 10 1 +select x3, x2, x1 from test order by -1 desc; +1 100 100 +10 1 10 +100 10 1 +select x3, x2, x1 from test order by x1 desc; +1 100 100 +10 1 10 +100 10 1 insert into test values (1, 10, 100), (10, 1, 10), (100, 100, 1); select x3, x2 from test group by x3, x2 order by x3; 1 100 @@ -54,6 +86,20 @@ SELECT x1 FROM test ORDER BY x3 + 1 ASC +explain syntax select x3, x2, x1 from test order by -1; +SELECT + x3, + x2, + x1 +FROM test +ORDER BY x1 ASC +explain syntax select x3 + 1, x2, x1 from test order by -1; +SELECT + x3 + 1, + x2, + x1 +FROM test +ORDER BY x1 ASC explain syntax select x3, x3 - x2, x2, x1 from test order by 2; SELECT x3, @@ -62,6 +108,14 @@ SELECT x1 FROM test ORDER BY x3 - x2 ASC +explain syntax select x3, x3 - x2, x2, x1 from test order by -2; +SELECT + x3, + x3 - x2, + x2, + x1 +FROM test +ORDER BY x2 ASC explain syntax select x3, if(x3 > 10, x3, plus(x1, x2)), x1 + x2 from test order by 2; SELECT x3, @@ -69,12 +123,28 @@ SELECT x1 + x2 FROM test ORDER BY if(x3 > 10, x3, x1 + x2) ASC +explain syntax select x3, if(x3 > 10, x3, plus(x1, x2)), x1 + x2 from test order by -2; +SELECT + x3, + if(x3 > 10, x3, x1 + x2), + x1 + x2 +FROM test +ORDER BY if(x3 > 10, x3, x1 + x2) ASC explain syntax select max(x1), x2 from test group by 2 order by 1, 2; SELECT max(x1), x2 FROM test GROUP BY x2 +ORDER BY + max(x1) ASC, + x2 ASC +explain syntax select max(x1), x2 from test group by -1 order by -2, -1; +SELECT + max(x1), + x2 +FROM test +GROUP BY x2 ORDER BY max(x1) ASC, x2 ASC @@ -83,16 +153,34 @@ SELECT 1 + greatest(x1, 1), x2 FROM test +GROUP BY + 1 + greatest(x1, 1), + x2 +explain syntax select 1 + greatest(x1, 1), x2 from test group by -2, -1; +SELECT + 1 + greatest(x1, 1), + x2 +FROM test GROUP BY 1 + greatest(x1, 1), x2 select max(x1), x2 from test group by 1, 2; -- { serverError 43, 184 } select 1 + max(x1), x2 from test group by 1, 2; -- { serverError 43, 184 } +select max(x1), x2 from test group by -2, -1; -- { serverError 43, 184 } +select 1 + max(x1), x2 from test group by -2, -1; -- { serverError 43, 184 } explain syntax select x1 + x3, x3 from test group by 1, 2; SELECT x1 + x3, x3 FROM test +GROUP BY + x1 + x3, + x3 +explain syntax select x1 + x3, x3 from test group by -2, -1; +SELECT + x1 + x3, + x3 +FROM test GROUP BY x1 + x3, x3 @@ -102,8 +190,14 @@ select x1, x1 * 2, max(x2), max(x3) from test2 group by 2, 1, x1 order by 1, 2, 1 2 10 100 10 20 1 10 100 200 100 1 +select x1, x1 * 2, max(x2), max(x3) from test2 group by 2, 1, x1 order by 1, 2, -1 desc, -2 asc; +1 2 10 100 +10 20 1 10 +100 200 100 1 select a, b, c, d, e, f from (select 44 a, 88 b, 13 c, 14 d, 15 e, 16 f) t group by 1,2,3,4,5,6 order by a; 44 88 13 14 15 16 +select a, b, c, d, e, f from (select 44 a, 88 b, 13 c, 14 d, 
15 e, 16 f) t group by 1,2,3,-3,-2,-1 order by a; +44 88 13 14 15 16 explain syntax select plus(1, 1) as a group by a; SELECT 1 + 1 AS a GROUP BY a diff --git a/tests/queries/0_stateless/02006_test_positional_arguments.sql b/tests/queries/0_stateless/02006_test_positional_arguments.sql index 159ad6bd427..6f427e0298d 100644 --- a/tests/queries/0_stateless/02006_test_positional_arguments.sql +++ b/tests/queries/0_stateless/02006_test_positional_arguments.sql @@ -9,11 +9,21 @@ insert into test values (1, 10, 100), (10, 1, 10), (100, 100, 1); -- { echo } select x3, x2, x1 from test order by 1; +select x3, x2, x1 from test order by -3; select x3, x2, x1 from test order by x3; +select x3, x2, x1 from test order by 3; +select x3, x2, x1 from test order by -1; +select x3, x2, x1 from test order by x1; + select x3, x2, x1 from test order by 1 desc; +select x3, x2, x1 from test order by -3 desc; select x3, x2, x1 from test order by x3 desc; +select x3, x2, x1 from test order by 3 desc; +select x3, x2, x1 from test order by -1 desc; +select x3, x2, x1 from test order by x1 desc; + insert into test values (1, 10, 100), (10, 1, 10), (100, 100, 1); select x3, x2 from test group by x3, x2 order by x3; select x3, x2 from test group by 1, 2 order by x3; @@ -25,21 +35,32 @@ select x1, x2, x3 from test order by 3 limit 1 by 1; explain syntax select x3, x2, x1 from test order by 1; explain syntax select x3 + 1, x2, x1 from test order by 1; +explain syntax select x3, x2, x1 from test order by -1; +explain syntax select x3 + 1, x2, x1 from test order by -1; explain syntax select x3, x3 - x2, x2, x1 from test order by 2; +explain syntax select x3, x3 - x2, x2, x1 from test order by -2; explain syntax select x3, if(x3 > 10, x3, plus(x1, x2)), x1 + x2 from test order by 2; +explain syntax select x3, if(x3 > 10, x3, plus(x1, x2)), x1 + x2 from test order by -2; explain syntax select max(x1), x2 from test group by 2 order by 1, 2; +explain syntax select max(x1), x2 from test group by -1 order by -2, -1; explain syntax select 1 + greatest(x1, 1), x2 from test group by 1, 2; +explain syntax select 1 + greatest(x1, 1), x2 from test group by -2, -1; select max(x1), x2 from test group by 1, 2; -- { serverError 43, 184 } select 1 + max(x1), x2 from test group by 1, 2; -- { serverError 43, 184 } +select max(x1), x2 from test group by -2, -1; -- { serverError 43, 184 } +select 1 + max(x1), x2 from test group by -2, -1; -- { serverError 43, 184 } explain syntax select x1 + x3, x3 from test group by 1, 2; +explain syntax select x1 + x3, x3 from test group by -2, -1; create table test2(x1 Int, x2 Int, x3 Int) engine=Memory; insert into test2 values (1, 10, 100), (10, 1, 10), (100, 100, 1); select x1, x1 * 2, max(x2), max(x3) from test2 group by 2, 1, x1 order by 1, 2, 4 desc, 3 asc; +select x1, x1 * 2, max(x2), max(x3) from test2 group by 2, 1, x1 order by 1, 2, -1 desc, -2 asc; select a, b, c, d, e, f from (select 44 a, 88 b, 13 c, 14 d, 15 e, 16 f) t group by 1,2,3,4,5,6 order by a; +select a, b, c, d, e, f from (select 44 a, 88 b, 13 c, 14 d, 15 e, 16 f) t group by 1,2,3,-3,-2,-1 order by a; explain syntax select plus(1, 1) as a group by a; select substr('aaaaaaaaaaaaaa', 8) as a group by a order by a; diff --git a/tests/queries/0_stateless/02932_group_by_null_fuzzer.sql b/tests/queries/0_stateless/02932_group_by_null_fuzzer.sql index 0c28c120d40..603c7783ef8 100644 --- a/tests/queries/0_stateless/02932_group_by_null_fuzzer.sql +++ b/tests/queries/0_stateless/02932_group_by_null_fuzzer.sql @@ -1,5 +1,6 @@ -- 
https://github.com/ClickHouse/ClickHouse/issues/43202 -- Queries are generated by the fuzzer, so don't expect them to make sense +SET enable_positional_arguments=0; SELECT NULL, '' FROM (SELECT toNullable(''), NULL AS key GROUP BY GROUPING SETS ((NULL))) AS s1 ALL LEFT JOIN (SELECT '' AS key, NULL AS value GROUP BY GROUPING SETS (('')) WITH TOTALS UNION ALL SELECT NULL AS key, toNullable(NULL) AS value GROUP BY '', NULL, '' WITH TOTALS) AS s2 USING (key); SELECT NULL GROUP BY NULL WITH TOTALS; SELECT 1048575, NULL, b FROM (SELECT '25.5' AS a, NULL, NULL AS b GROUP BY GROUPING SETS ((0.0001)) WITH TOTALS) AS js1 ANY RIGHT JOIN (SELECT NULL AS a, NULL AS b WHERE NULL GROUP BY NULL, -9223372036854775807 WITH CUBE WITH TOTALS UNION ALL SELECT NULL AS a, NULL AS b GROUP BY 1, '21474836.46' WITH TOTALS) AS js2 USING (a, b) ORDER BY nan DESC NULLS LAST, '9223372036854775807' DESC NULLS LAST, a ASC NULLS LAST; From 4bb63f0a6f066bca972b5b3754a20f0a56354b8d Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 28 Dec 2023 13:05:15 +0100 Subject: [PATCH 0086/1081] Update test --- .../02916_broken_projection.reference | 124 ------------------ .../0_stateless/02916_broken_projection.sh | 16 +-- 2 files changed, 8 insertions(+), 132 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index 358304de74a..d340326455a 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -2,11 +2,6 @@ insert new part insert new part insert new part insert new part -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -21,11 +16,6 @@ check table 1 0 broke metadata of part 'proj' (parent part: all_2_2_0) -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -46,11 +36,6 @@ all_2_2_0 broke data of part 'proj_2' (parent part: all_2_2_0) broken projections info all_2_2_0 proj FILE_DOESNT_EXIST -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -63,11 +48,6 @@ check table broken projections info all_2_2_0 proj FILE_DOESNT_EXIST all_2_2_0 proj_2 NO_FILE_IN_DATA_PART -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -94,14 +74,6 @@ broken projections info all_2_2_0 proj FILE_DOESNT_EXIST all_2_2_0 proj_2 NO_FILE_IN_DATA_PART all_3_3_0 proj_2 NO_FILE_IN_DATA_PART -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 0 ['proj','proj_2'] -all_3_5_1 1 ['proj'] -all_4_4_0 0 ['proj','proj_2'] -all_5_5_0 0 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -131,14 +103,6 @@ all_1_1_0 proj_2 FILE_DOESNT_EXIST all_2_2_0 proj NO_FILE_IN_DATA_PART all_2_2_0 proj_2 FILE_DOESNT_EXIST all_3_3_0 proj_2 FILE_DOESNT_EXIST -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 0 ['proj','proj_2'] -all_3_5_1 1 ['proj'] -all_4_4_0 0 ['proj','proj_2'] -all_5_5_0 0 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -155,18 +119,6 @@ check table full 
(test - all_1_1_0) all_1_1_0 materialize projection proj check table full (test - ) -system.parts -all_0_0_0 0 ['proj','proj_2'] -all_0_0_0_6 1 ['proj','proj_2'] -all_1_1_0 0 ['proj','proj_2'] -all_1_1_0_6 1 ['proj','proj_2'] -all_2_2_0 0 ['proj','proj_2'] -all_2_2_0_6 1 ['proj','proj_2'] -all_3_3_0 0 ['proj','proj_2'] -all_3_5_1 0 ['proj'] -all_3_5_1_6 1 ['proj'] -all_4_4_0 0 ['proj','proj_2'] -all_5_5_0 0 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -189,25 +141,6 @@ OPTIMIZE TABLE test FINAL insert new part optimize OPTIMIZE TABLE test FINAL -system.parts -all_0_0_0 0 ['proj','proj_2'] -all_0_0_0_6 0 ['proj','proj_2'] -all_0_0_0_7 0 ['proj','proj_2'] -all_0_8_2_7 1 ['proj_2'] -all_1_1_0 0 ['proj','proj_2'] -all_1_1_0_6 0 ['proj','proj_2'] -all_1_1_0_7 0 ['proj','proj_2'] -all_2_2_0 0 ['proj','proj_2'] -all_2_2_0_6 0 ['proj','proj_2'] -all_2_2_0_7 0 ['proj','proj_2'] -all_3_3_0 0 ['proj','proj_2'] -all_3_5_1 0 ['proj'] -all_3_5_1_6 0 ['proj'] -all_3_5_1_7 0 ['proj','proj_2'] -all_4_4_0 0 ['proj','proj_2'] -all_5_5_0 0 ['proj','proj_2'] -all_8_8_0 0 ['proj','proj_2'] -all_9_9_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -224,9 +157,6 @@ insert new part insert new part insert new part insert new part -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] select from projection 'proj' used projections SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj @@ -235,7 +165,6 @@ used projections SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 -system.parts select from projection 'proj' used projections SELECT c FROM test2_replica WHERE d == 12 OR d == 16 ORDER BY c; proj @@ -248,9 +177,6 @@ check table broke data of part 'proj' (parent part: all_0_0_0) check table full (test2 - all_0_0_0) all_0_0_0 -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] select from projection 'proj' used projections SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj @@ -262,9 +188,6 @@ check table broke data of part 'all_0_0_0' check table full (test2 - all_0_0_0) all_0_0_0 -system.parts -all_0_0_0 0 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] select from projection 'proj' used projections SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj @@ -273,9 +196,6 @@ used projections SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 check table 1 -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] select from projection 'proj' used projections SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj @@ -288,11 +208,6 @@ insert new part insert new part insert new part insert new part -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -307,11 +222,6 @@ check table 1 0 broke data of part 'proj' (parent part: all_2_2_0) -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj', expect error: proj FILE_DOESNT_EXIST select from projection 'proj_2' @@ -325,11 +235,6 @@ broken projections info all_2_2_0 proj NO_FILE_IN_DATA_PART BACKUP_CREATED RESTORED -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -345,11 +250,6 @@ check table broken projections info 0 broke all data of part 'proj' (parent 
part: all_2_2_0) -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj', expect error: proj STD_EXCEPTION select from projection 'proj_2' @@ -363,15 +263,6 @@ broken projections info all_2_2_0 proj FILE_DOESNT_EXIST FILE_DOESNT_EXIST materialize projection proj -system.parts -all_0_0_0 0 ['proj','proj_2'] -all_0_0_0_4 1 ['proj','proj_2'] -all_1_1_0 0 ['proj','proj_2'] -all_1_1_0_4 1 ['proj','proj_2'] -all_2_2_0 0 ['proj','proj_2'] -all_2_2_0_4 1 ['proj','proj_2'] -all_3_3_0 0 ['proj','proj_2'] -all_3_3_0_4 1 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -388,11 +279,6 @@ broken projections info all_2_2_0 proj FILE_DOESNT_EXIST BACKUP_CREATED RESTORED -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 @@ -407,11 +293,6 @@ check table 1 0 broke all data of part 'proj' (parent part: all_1_1_0) -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj', expect error: proj select from projection 'proj_2' 12 @@ -424,11 +305,6 @@ broken projections info all_1_1_0 proj FILE_DOESNT_EXIST BACKUP_CREATED RESTORED -system.parts -all_0_0_0 1 ['proj','proj_2'] -all_1_1_0 1 ['proj','proj_2'] -all_2_2_0 1 ['proj','proj_2'] -all_3_3_0 1 ['proj','proj_2'] select from projection 'proj' 12 16 diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 55e613b8f3a..a1df5dc858d 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -1,5 +1,5 @@ #!/usr/bin/env bash -# Tags: long, no-random-merge-tree-settings, no-random-settings +# Tags: long, no-random-merge-tree-settings, no-random-settings, no-s3-storage # shellcheck disable=SC2046 CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) @@ -149,12 +149,12 @@ function check() expected_error=$3 fi - echo 'system.parts' - $CLICKHOUSE_CLIENT -q " - SELECT name, active, projections - FROM system.parts - WHERE table='$table' AND database=currentDatabase() - ORDER BY name;" + #echo 'system.parts' + #$CLICKHOUSE_CLIENT -q " + #SELECT name, active, projections + #FROM system.parts + #WHERE table='$table' AND database=currentDatabase() + #ORDER BY name;" query_id=$(random 8) @@ -447,7 +447,7 @@ function test3() break_projection test proj all_2_2_0 part - check test proj STD_EXCEPTION + check test broken_projections_info test From e2f4219c12c216ab32a267b153969b758126a077 Mon Sep 17 00:00:00 2001 From: flynn Date: Thu, 28 Dec 2023 12:22:30 +0000 Subject: [PATCH 0087/1081] Fix --- src/Interpreters/TreeOptimizer.cpp | 7 +++---- .../02943_positional_arguments_bugs.reference | 11 ++++++++++- .../0_stateless/02943_positional_arguments_bugs.sql | 13 +++++++------ 3 files changed, 20 insertions(+), 11 deletions(-) diff --git a/src/Interpreters/TreeOptimizer.cpp b/src/Interpreters/TreeOptimizer.cpp index 729e2ed6007..57dba3eef89 100644 --- a/src/Interpreters/TreeOptimizer.cpp +++ b/src/Interpreters/TreeOptimizer.cpp @@ -76,11 +76,10 @@ const std::unordered_set possibly_injective_function_names */ void appendUnusedGroupByColumn(ASTSelectQuery * select_query) { - /// You must insert a constant that is not the name of the column in the table. Such a case is rare, but it happens. 
- /// Also start unused_column integer must not intersect with ([1, source_columns.size()]) - /// might be in positional GROUP BY. + /// Since ASTLiteral is different from ASTIdentifier, so we can use a special constant String Literal for this, + /// and do not need to worry about it conflict with the name of the column in the table. select_query->setExpression(ASTSelectQuery::Expression::GROUP_BY, std::make_shared()); - select_query->groupBy()->children.emplace_back(std::make_shared(static_cast(-1))); + select_query->groupBy()->children.emplace_back(std::make_shared("__unused_group_by_column")); } /// Eliminates injective function calls and constant expressions from group by statement. diff --git a/tests/queries/0_stateless/02943_positional_arguments_bugs.reference b/tests/queries/0_stateless/02943_positional_arguments_bugs.reference index 702e1261186..47e8df9e382 100644 --- a/tests/queries/0_stateless/02943_positional_arguments_bugs.reference +++ b/tests/queries/0_stateless/02943_positional_arguments_bugs.reference @@ -1,2 +1,11 @@ -45 1 +0 0 +4 4 +3 3 +2 2 +5 5 +1 1 +6 6 +7 7 +9 9 +8 8 processed 99 0 diff --git a/tests/queries/0_stateless/02943_positional_arguments_bugs.sql b/tests/queries/0_stateless/02943_positional_arguments_bugs.sql index b8cf73da42d..8cc3fb4b17d 100644 --- a/tests/queries/0_stateless/02943_positional_arguments_bugs.sql +++ b/tests/queries/0_stateless/02943_positional_arguments_bugs.sql @@ -2,18 +2,19 @@ DROP TABLE IF EXISTS t; CREATE TABLE t ( - `n` int + `n` int, + `__unused_group_by_column` int ) - ENGINE = MergeTree - ORDER BY n AS -SELECT * +ENGINE = MergeTree +ORDER BY n AS +SELECT number, number FROM numbers(10); SELECT sum(n), - 1 AS x + __unused_group_by_column FROM t -GROUP BY x; +GROUP BY __unused_group_by_column; SELECT 'processed' AS type, From 3d2e95dbf5f81185d2a091d5e58490f66ed04bef Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 28 Dec 2023 13:49:49 +0100 Subject: [PATCH 0088/1081] Fix build --- src/Storages/MergeTree/checkDataPart.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Storages/MergeTree/checkDataPart.cpp b/src/Storages/MergeTree/checkDataPart.cpp index ea46b6f0d56..5b60f0a7fc2 100644 --- a/src/Storages/MergeTree/checkDataPart.cpp +++ b/src/Storages/MergeTree/checkDataPart.cpp @@ -332,7 +332,7 @@ static IMergeTreeDataPart::Checksums checkDataPart( if (throw_on_broken_projection && !broken_projections_message.empty()) { - throw Exception(ErrorCodes::BROKEN_PROJECTION, broken_projections_message.data()); + throw Exception(ErrorCodes::BROKEN_PROJECTION, "{}", broken_projections_message); } if (require_checksums && !projections_on_disk.empty()) From 2e9cdd17ef136f064042b541dbc68ef64ba8194f Mon Sep 17 00:00:00 2001 From: flynn Date: Thu, 28 Dec 2023 14:08:14 +0000 Subject: [PATCH 0089/1081] Fix flaky test --- src/Analyzer/Passes/QueryAnalysisPass.cpp | 26 ++++++++++++++----- .../02943_positional_arguments_bugs.reference | 11 ++++---- .../02943_positional_arguments_bugs.sql | 6 +++-- 3 files changed, 29 insertions(+), 14 deletions(-) diff --git a/src/Analyzer/Passes/QueryAnalysisPass.cpp b/src/Analyzer/Passes/QueryAnalysisPass.cpp index 3290d918a8b..9ec6d9e358c 100644 --- a/src/Analyzer/Passes/QueryAnalysisPass.cpp +++ b/src/Analyzer/Passes/QueryAnalysisPass.cpp @@ -2156,19 +2156,31 @@ void QueryAnalyzer::replaceNodesWithPositionalArguments(QueryTreeNodePtr & node_ node_to_replace = &sort_node->getExpression(); auto * constant_node = (*node_to_replace)->as(); - if (!constant_node || constant_node->getValue().getType() 
!= Field::Types::UInt64) + + if (!constant_node + || (constant_node->getValue().getType() != Field::Types::UInt64 && constant_node->getValue().getType() != Field::Types::Int64)) continue; - UInt64 positional_argument_number = constant_node->getValue().get(); - if (positional_argument_number == 0 || positional_argument_number > projection_nodes.size()) - throw Exception(ErrorCodes::BAD_ARGUMENTS, + UInt64 pos; + if (constant_node->getValue().getType() == Field::Types::UInt64) + { + pos = constant_node->getValue().get(); + } + else // Int64 + { + auto value = constant_node->getValue().get(); + pos = value > 0 ? value : projection_nodes.size() + value + 1; + } + + if (!pos || pos > projection_nodes.size()) + throw Exception( + ErrorCodes::BAD_ARGUMENTS, "Positional argument number {} is out of bounds. Expected in range [1, {}]. In scope {}", - positional_argument_number, + pos, projection_nodes.size(), scope.scope_node->formatASTForErrorMessage()); - --positional_argument_number; - *node_to_replace = projection_nodes[positional_argument_number]; + *node_to_replace = projection_nodes[--pos]; } } diff --git a/tests/queries/0_stateless/02943_positional_arguments_bugs.reference b/tests/queries/0_stateless/02943_positional_arguments_bugs.reference index 47e8df9e382..08310b7cf27 100644 --- a/tests/queries/0_stateless/02943_positional_arguments_bugs.reference +++ b/tests/queries/0_stateless/02943_positional_arguments_bugs.reference @@ -1,11 +1,12 @@ 0 0 -4 4 -3 3 -2 2 -5 5 1 1 +2 2 +3 3 +4 4 +5 5 6 6 7 7 -9 9 8 8 +9 9 +45 1 processed 99 0 diff --git a/tests/queries/0_stateless/02943_positional_arguments_bugs.sql b/tests/queries/0_stateless/02943_positional_arguments_bugs.sql index 8cc3fb4b17d..9b1b872ae40 100644 --- a/tests/queries/0_stateless/02943_positional_arguments_bugs.sql +++ b/tests/queries/0_stateless/02943_positional_arguments_bugs.sql @@ -3,7 +3,7 @@ DROP TABLE IF EXISTS t; CREATE TABLE t ( `n` int, - `__unused_group_by_column` int + `__unused_group_by_column` int ) ENGINE = MergeTree ORDER BY n AS @@ -14,7 +14,9 @@ SELECT sum(n), __unused_group_by_column FROM t -GROUP BY __unused_group_by_column; +GROUP BY __unused_group_by_column ORDER BY __unused_group_by_column; + +SELECT sum(n), 1 as x from t group by x; SELECT 'processed' AS type, From 493f938c455e9bd507d521b7974b1e7a9e7c81b2 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Thu, 28 Dec 2023 17:29:25 +0100 Subject: [PATCH 0090/1081] Update 02916_broken_projection.sh --- tests/queries/0_stateless/02916_broken_projection.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index a1df5dc858d..ca62d275189 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -447,7 +447,7 @@ function test3() break_projection test proj all_2_2_0 part - check test + check test proj ErrnoException broken_projections_info test From 91657185c8fc4349cb8825ac2e5d6126fddb8289 Mon Sep 17 00:00:00 2001 From: kssenii Date: Fri, 29 Dec 2023 13:05:15 +0100 Subject: [PATCH 0091/1081] Fxi --- tests/queries/0_stateless/02916_broken_projection.reference | 2 +- tests/queries/0_stateless/02916_broken_projection.sh | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index 
d340326455a..beaca49f99c 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -251,7 +251,7 @@ broken projections info 0 broke all data of part 'proj' (parent part: all_2_2_0) select from projection 'proj', expect error: proj -STD_EXCEPTION +Errno select from projection 'proj_2' 12 16 diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index ca62d275189..99e54b08b74 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -447,7 +447,7 @@ function test3() break_projection test proj all_2_2_0 part - check test proj ErrnoException + check test proj Errno broken_projections_info test From e0f0100332085f3075951a6d9bf5c8d69f6d9940 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Fri, 29 Dec 2023 15:38:15 +0100 Subject: [PATCH 0092/1081] Update 02916_broken_projection.reference --- tests/queries/0_stateless/02916_broken_projection.reference | 1 + 1 file changed, 1 insertion(+) diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference index beaca49f99c..3967215e5de 100644 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ b/tests/queries/0_stateless/02916_broken_projection.reference @@ -252,6 +252,7 @@ broken projections info broke all data of part 'proj' (parent part: all_2_2_0) select from projection 'proj', expect error: proj Errno +Errno select from projection 'proj_2' 12 16 From b70ff6d8ea71d4633cdcdbe3ef486707e70c1abb Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Mon, 1 Jan 2024 11:02:57 +0100 Subject: [PATCH 0093/1081] Fix build --- src/Backups/BackupIO_AzureBlobStorage.cpp | 33 +++++++++++++++++++++-- src/Backups/BackupIO_AzureBlobStorage.h | 2 ++ 2 files changed, 33 insertions(+), 2 deletions(-) diff --git a/src/Backups/BackupIO_AzureBlobStorage.cpp b/src/Backups/BackupIO_AzureBlobStorage.cpp index a1fd5bd8327..bd4efcf63ae 100644 --- a/src/Backups/BackupIO_AzureBlobStorage.cpp +++ b/src/Backups/BackupIO_AzureBlobStorage.cpp @@ -218,10 +218,39 @@ void BackupWriterAzureBlobStorage::copyFileFromDisk(const String & path_in_backu BackupWriterDefault::copyFileFromDisk(path_in_backup, src_disk, src_path, copy_encrypted, start_pos, length); } +void BackupWriterAzureBlobStorage::copyFile(const String & destination, const String & source, size_t size) +{ + std::shared_ptr src_client; + std::shared_ptr dest_client; + StorageAzureBlob::Configuration src_configuration = configuration; + src_configuration.container = source; + src_client = StorageAzureBlob::createClient(src_configuration, /* is_read_only */ false); + + StorageAzureBlob::Configuration dest_configuration = configuration; + dest_configuration.container = destination; + dest_client = StorageAzureBlob::createClient(dest_configuration, /* is_read_only */ false); + + LOG_TRACE(log, "Copying file inside backup from {} to {} ", source, destination); + copyAzureBlobStorageFile( + src_client, + dest_client, + configuration.container, + fs::path(configuration.blob_path), + 0, + size, + /* dest_bucket= */ destination, + /* dest_key= */ configuration.blob_path, + settings, + read_settings, + {}, + threadPoolCallbackRunner(getBackupsIOThreadPool().get(), "BackupRDAzure"), + /* for_disk_azure_blob_storage= */ true); +} + void BackupWriterAzureBlobStorage::copyDataToFile(const 
String & path_in_backup, const CreateReadBufferFunction & create_read_buffer, UInt64 start_pos, UInt64 length) { copyDataToAzureBlobStorageFile(create_read_buffer, start_pos, length, client, configuration.container, path_in_backup, settings, {}, - threadPoolCallbackRunner(getBackupsIOThreadPool().get(), "BackupWriterS3")); + threadPoolCallbackRunner(getBackupsIOThreadPool().get(), "BackupWRAzure")); } BackupWriterAzureBlobStorage::~BackupWriterAzureBlobStorage() = default; @@ -257,7 +286,7 @@ UInt64 BackupWriterAzureBlobStorage::getFileSize(const String & file_name) RelativePathsWithMetadata children; object_storage->listObjects(key,children,/*max_keys*/0); if (children.empty()) - throw Exception(ErrorCodes::AZURE_BLOB_STORAGE_ERROR, "Object {} must exist"); + throw Exception(ErrorCodes::AZURE_BLOB_STORAGE_ERROR, "Object must exist"); return children[0].metadata.size_bytes; } diff --git a/src/Backups/BackupIO_AzureBlobStorage.h b/src/Backups/BackupIO_AzureBlobStorage.h index 65affb9f079..87a6c3ef675 100644 --- a/src/Backups/BackupIO_AzureBlobStorage.h +++ b/src/Backups/BackupIO_AzureBlobStorage.h @@ -48,6 +48,8 @@ public: void copyFileFromDisk(const String & path_in_backup, DiskPtr src_disk, const String & src_path, bool copy_encrypted, UInt64 start_pos, UInt64 length) override; + void copyFile(const String & destination, const String & source, size_t size) override; + void removeFile(const String & file_name) override; void removeFiles(const Strings & file_names) override; From 4122de97213d835de5202d4ca741b4972973884b Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Tue, 2 Jan 2024 20:19:01 +0100 Subject: [PATCH 0094/1081] Updated tests and added settings --- src/Backups/BackupIO_AzureBlobStorage.cpp | 6 +- .../AzureBlobStorage/AzureBlobStorageAuth.cpp | 5 +- .../AzureBlobStorage/AzureObjectStorage.h | 11 ++- .../copyAzureBlobStorageFile.cpp | 68 +++++++++++++++++-- src/Storages/StorageAzureBlob.cpp | 2 +- .../configs/config.xml | 11 --- .../configs/disable_profilers.xml | 13 ---- .../configs/users.xml | 8 --- .../test.py | 2 - 9 files changed, 80 insertions(+), 46 deletions(-) delete mode 100644 tests/integration/test_backup_restore_azure_blob_storage/configs/config.xml delete mode 100644 tests/integration/test_backup_restore_azure_blob_storage/configs/disable_profilers.xml delete mode 100644 tests/integration/test_backup_restore_azure_blob_storage/configs/users.xml diff --git a/src/Backups/BackupIO_AzureBlobStorage.cpp b/src/Backups/BackupIO_AzureBlobStorage.cpp index bd4efcf63ae..15e8e92a85d 100644 --- a/src/Backups/BackupIO_AzureBlobStorage.cpp +++ b/src/Backups/BackupIO_AzureBlobStorage.cpp @@ -139,7 +139,7 @@ void BackupReaderAzureBlobStorage::copyFileToDisk(const String & path_in_backup, settings, read_settings, object_attributes, - threadPoolCallbackRunner(getBackupsIOThreadPool().get(), "BackupReaderAzureBlobStorage"), + threadPoolCallbackRunner(getBackupsIOThreadPool().get(), "BackupRDAzure"), /* for_disk_azure_blob_storage= */ true); return file_size; @@ -209,7 +209,7 @@ void BackupWriterAzureBlobStorage::copyFileFromDisk(const String & path_in_backu settings, read_settings, {}, - threadPoolCallbackRunner(getBackupsIOThreadPool().get(), "BackupWriterS3")); + threadPoolCallbackRunner(getBackupsIOThreadPool().get(), "BackupWRAzure")); return; /// copied! 
} } @@ -243,7 +243,7 @@ void BackupWriterAzureBlobStorage::copyFile(const String & destination, const St settings, read_settings, {}, - threadPoolCallbackRunner(getBackupsIOThreadPool().get(), "BackupRDAzure"), + threadPoolCallbackRunner(getBackupsIOThreadPool().get(), "BackupWRAzure"), /* for_disk_azure_blob_storage= */ true); } diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp b/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp index 6075b385a6c..9e703d6fc5e 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp @@ -164,7 +164,10 @@ std::unique_ptr getAzureBlobStorageSettings(const Po config.getUInt64(config_prefix + ".min_bytes_for_seek", 1024 * 1024), config.getInt(config_prefix + ".max_single_read_retries", 3), config.getInt(config_prefix + ".max_single_download_retries", 3), - config.getInt(config_prefix + ".list_object_keys_size", 1000) + config.getInt(config_prefix + ".list_object_keys_size", 1000), + config.getUInt64(config_prefix + ".min_upload_part_size", 16 * 1024 * 1024), + config.getUInt64(config_prefix + ".max_upload_part_size", 5ULL * 1024 * 1024 * 1024), + config.getUInt64(config_prefix + ".max_part_number", 10000) ); } diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h index 8e3d50418d3..55c81b4b7d9 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h @@ -24,12 +24,18 @@ struct AzureObjectStorageSettings uint64_t min_bytes_for_seek_, int max_single_read_retries_, int max_single_download_retries_, - int list_object_keys_size_) + int list_object_keys_size_, + size_t min_upload_part_size_, + size_t max_upload_part_size_, + size_t max_part_number_) : max_single_part_upload_size(max_single_part_upload_size_) , min_bytes_for_seek(min_bytes_for_seek_) , max_single_read_retries(max_single_read_retries_) , max_single_download_retries(max_single_download_retries_) , list_object_keys_size(list_object_keys_size_) + , min_upload_part_size(min_upload_part_size_) + , max_upload_part_size(max_upload_part_size_) + , max_part_number(max_part_number_) { } @@ -40,6 +46,9 @@ struct AzureObjectStorageSettings size_t max_single_read_retries = 3; size_t max_single_download_retries = 3; int list_object_keys_size = 1000; + size_t min_upload_part_size = 16 * 1024 * 1024; + size_t max_upload_part_size = 5ULL * 1024 * 1024 * 1024; + size_t max_part_number = 10000; }; using AzureClient = Azure::Storage::Blobs::BlobContainerClient; diff --git a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp index 0a0a080b5cb..5ca30fa8071 100644 --- a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp +++ b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp @@ -22,15 +22,17 @@ namespace ProfileEvents extern const Event DiskAzureUploadPart; } -namespace ErrorCodes -{ - extern const int LOGICAL_ERROR; -} - namespace DB { +namespace ErrorCodes +{ + extern const int LOGICAL_ERROR; + extern const int INVALID_CONFIG_PARAMETER; +} + + size_t max_single_operation_copy_size = 256 * 1024 * 1024; @@ -106,6 +108,60 @@ namespace std::mutex bg_tasks_mutex; std::condition_variable bg_tasks_condvar; + void calculatePartSize() + { + if (!total_size) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Chosen multipart upload for an empty file. 
This must not happen"); + + auto max_part_number = settings.get()->max_part_number; + auto min_upload_part_size = settings.get()->min_upload_part_size; + auto max_upload_part_size = settings.get()->max_upload_part_size; + + if (!max_part_number) + throw Exception(ErrorCodes::INVALID_CONFIG_PARAMETER, "max_part_number must not be 0"); + else if (!min_upload_part_size) + throw Exception(ErrorCodes::INVALID_CONFIG_PARAMETER, "min_upload_part_size must not be 0"); + else if (max_upload_part_size < min_upload_part_size) + throw Exception(ErrorCodes::INVALID_CONFIG_PARAMETER, "max_upload_part_size must not be less than min_upload_part_size"); + + size_t part_size = min_upload_part_size; + size_t num_parts = (total_size + part_size - 1) / part_size; + + if (num_parts > max_part_number) + { + part_size = (total_size + max_part_number - 1) / max_part_number; + num_parts = (total_size + part_size - 1) / part_size; + } + + if (part_size > max_upload_part_size) + { + part_size = max_upload_part_size; + num_parts = (total_size + part_size - 1) / part_size; + } + + if (num_parts < 1 || num_parts > max_part_number || part_size < min_upload_part_size || part_size > max_upload_part_size) + { + String msg; + if (num_parts < 1) + msg = "Number of parts is zero"; + else if (num_parts > max_part_number) + msg = fmt::format("Number of parts {} exceeds {}", num_parts, max_part_number); + else if (part_size < min_upload_part_size) + msg = fmt::format("Size of a part {} is less than {}", part_size, min_upload_part_size); + else + msg = fmt::format("Size of a part {} exceeds {}", part_size, max_upload_part_size); + + throw Exception( + ErrorCodes::INVALID_CONFIG_PARAMETER, + "{} while writing {} bytes to AzureBlobStorage. Check max_part_number = {}, " + "min_upload_part_size = {}, max_upload_part_size = {}", + msg, total_size, max_part_number, min_upload_part_size, max_upload_part_size); + } + + /// We've calculated the size of a normal part (the final part can be smaller). + normal_part_size = part_size; + } + public: void performCopy() { @@ -120,7 +176,7 @@ namespace void performMultipartUpload() { - normal_part_size = 1024; + calculatePartSize(); size_t position = offset; size_t end_position = offset + total_size; diff --git a/src/Storages/StorageAzureBlob.cpp b/src/Storages/StorageAzureBlob.cpp index 1b28a2c2fac..f1070c8c31e 100644 --- a/src/Storages/StorageAzureBlob.cpp +++ b/src/Storages/StorageAzureBlob.cpp @@ -1139,7 +1139,7 @@ StorageAzureBlobSource::ReaderHolder StorageAzureBlobSource::createReader() QueryPipelineBuilder builder; std::shared_ptr source; std::unique_ptr read_buf; - std::optional num_rows_from_cache = need_only_count && getContext()->getSettingsRef().use_cache_for_count_from_files + std::optional num_rows_from_cache = need_only_count && getContext()->getSettingsRef().use_cache_for_count_from_files ?
tryGetNumRowsFromCache(path_with_metadata) : std::nullopt; if (num_rows_from_cache) { diff --git a/tests/integration/test_backup_restore_azure_blob_storage/configs/config.xml b/tests/integration/test_backup_restore_azure_blob_storage/configs/config.xml deleted file mode 100644 index 5725dce40cd..00000000000 --- a/tests/integration/test_backup_restore_azure_blob_storage/configs/config.xml +++ /dev/null @@ -1,11 +0,0 @@ - - 1 - 0 - 0.0 - 0 - 1 - 1 - 0 - 16 - 16 - \ No newline at end of file diff --git a/tests/integration/test_backup_restore_azure_blob_storage/configs/disable_profilers.xml b/tests/integration/test_backup_restore_azure_blob_storage/configs/disable_profilers.xml deleted file mode 100644 index b74bb1502ce..00000000000 --- a/tests/integration/test_backup_restore_azure_blob_storage/configs/disable_profilers.xml +++ /dev/null @@ -1,13 +0,0 @@ - - - - - 0 - 0 - 0 - 1000 - 1 - 1 - - - diff --git a/tests/integration/test_backup_restore_azure_blob_storage/configs/users.xml b/tests/integration/test_backup_restore_azure_blob_storage/configs/users.xml deleted file mode 100644 index c12eb2f79f4..00000000000 --- a/tests/integration/test_backup_restore_azure_blob_storage/configs/users.xml +++ /dev/null @@ -1,8 +0,0 @@ - - - - - default - - - diff --git a/tests/integration/test_backup_restore_azure_blob_storage/test.py b/tests/integration/test_backup_restore_azure_blob_storage/test.py index 0a48d3523f0..06c18d7468f 100644 --- a/tests/integration/test_backup_restore_azure_blob_storage/test.py +++ b/tests/integration/test_backup_restore_azure_blob_storage/test.py @@ -24,8 +24,6 @@ def cluster(): cluster = ClickHouseCluster(__file__) cluster.add_instance( "node", - main_configs=["configs/config.xml"], - user_configs=["configs/disable_profilers.xml", "configs/users.xml"], with_azurite=True, ) cluster.start() From df221f7db65fd17af6a71704f756e47ceec7a928 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Wed, 3 Jan 2024 11:35:06 +0100 Subject: [PATCH 0095/1081] Renamed Bucket-Key to Container-Blob --- src/Backups/BackupIO_AzureBlobStorage.cpp | 14 +++--- .../copyAzureBlobStorageFile.cpp | 44 +++++++++---------- .../copyAzureBlobStorageFile.h | 10 ++--- 3 files changed, 34 insertions(+), 34 deletions(-) diff --git a/src/Backups/BackupIO_AzureBlobStorage.cpp b/src/Backups/BackupIO_AzureBlobStorage.cpp index 15e8e92a85d..de40fc6b33b 100644 --- a/src/Backups/BackupIO_AzureBlobStorage.cpp +++ b/src/Backups/BackupIO_AzureBlobStorage.cpp @@ -134,8 +134,8 @@ void BackupReaderAzureBlobStorage::copyFileToDisk(const String & path_in_backup, fs::path(configuration.blob_path) / path_in_backup, 0, file_size, - /* dest_bucket= */ blob_path[1], - /* dest_key= */ blob_path[0], + /* dest_container */ blob_path[1], + /* dest_path */ blob_path[0], settings, read_settings, object_attributes, @@ -178,7 +178,7 @@ void BackupWriterAzureBlobStorage::copyFileFromDisk(const String & path_in_backu auto source_data_source_description = src_disk->getDataSourceDescription(); if (source_data_source_description.sameKind(data_source_description) && (source_data_source_description.is_encrypted == copy_encrypted)) { - /// getBlobPath() can return more than 3 elements if the file is stored as multiple objects in AzureBlobStorage bucket. + /// getBlobPath() can return more than 3 elements if the file is stored as multiple objects in AzureBlobStorage container. /// In this case we can't use the native copy. 
if (auto blob_path = src_disk->getBlobPath(src_path); blob_path.size() == 2) { @@ -200,8 +200,8 @@ void BackupWriterAzureBlobStorage::copyFileFromDisk(const String & path_in_backu copyAzureBlobStorageFile( src_client, client, - /* src_bucket */ blob_path[1], - /* src_key= */ blob_path[0], + /* src_container */ blob_path[1], + /* src_path */ blob_path[0], start_pos, length, configuration.container, @@ -238,8 +238,8 @@ void BackupWriterAzureBlobStorage::copyFile(const String & destination, const St fs::path(configuration.blob_path), 0, size, - /* dest_bucket= */ destination, - /* dest_key= */ configuration.blob_path, + /* dest_container */ destination, + /* dest_path */ configuration.blob_path, settings, read_settings, {}, diff --git a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp index 5ca30fa8071..df1341efdd1 100644 --- a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp +++ b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp @@ -46,8 +46,8 @@ namespace std::shared_ptr client_, size_t offset_, size_t total_size_, - const String & dest_bucket_, - const String & dest_key_, + const String & dest_container_, + const String & dest_blob_, std::shared_ptr settings_, const std::optional> & object_metadata_, ThreadPoolCallbackRunner schedule_, @@ -57,8 +57,8 @@ namespace , client(client_) , offset (offset_) , total_size (total_size_) - , dest_bucket(dest_bucket_) - , dest_key(dest_key_) + , dest_container(dest_container_) + , dest_blob(dest_blob_) , settings(settings_) , object_metadata(object_metadata_) , schedule(schedule_) @@ -75,8 +75,8 @@ namespace std::shared_ptr client; size_t offset; size_t total_size; - const String & dest_bucket; - const String & dest_key; + const String & dest_container; + const String & dest_blob; std::shared_ptr settings; const std::optional> & object_metadata; ThreadPoolCallbackRunner schedule; @@ -170,7 +170,7 @@ namespace void completeMultipartUpload() { - auto block_blob_client = client->GetBlockBlobClient(dest_key); + auto block_blob_client = client->GetBlockBlobClient(dest_blob); block_blob_client.CommitBlockList(block_ids); } @@ -207,7 +207,7 @@ namespace void uploadPart(size_t part_offset, size_t part_size) { - LOG_TRACE(log, "Writing part. Bucket: {}, Key: {}, Size: {}", dest_bucket, dest_key, part_size); + LOG_TRACE(log, "Writing part. Container: {}, Blob: {}, Size: {}", dest_container, dest_blob, part_size); if (!part_size) { @@ -286,7 +286,7 @@ namespace std::lock_guard lock(bg_tasks_mutex); /// Protect bg_tasks from race task.block_id = block_id; - LOG_TRACE(log, "Writing part finished. Bucket: {}, Key: {}, block_id: {}, Parts: {}", dest_bucket, dest_key, block_id, bg_tasks.size()); + LOG_TRACE(log, "Writing part finished. 
Container: {}, Blob: {}, block_id: {}, Parts: {}", dest_container, dest_blob, block_id, bg_tasks.size()); } String processUploadPartRequest(UploadPartTask & task) @@ -295,7 +295,7 @@ namespace if (for_disk_azure_blob_storage) ProfileEvents::increment(ProfileEvents::DiskAzureUploadPart); - auto block_blob_client = client->GetBlockBlobClient(dest_key); + auto block_blob_client = client->GetBlockBlobClient(dest_blob); task.block_id = getRandomASCIIString(64); Azure::Core::IO::MemoryBodyStream memory(reinterpret_cast(task.data), task.size); block_blob_client.StageBlock(task.block_id, memory); @@ -330,14 +330,14 @@ void copyDataToAzureBlobStorageFile( size_t offset, size_t size, std::shared_ptr & dest_client, - const String & dest_bucket, - const String & dest_key, + const String & dest_container, + const String & dest_blob, std::shared_ptr settings, const std::optional> & object_metadata, ThreadPoolCallbackRunner schedule, bool for_disk_azure_blob_storage) { - UploadHelper helper{create_read_buffer, dest_client, offset, size, dest_bucket, dest_key, settings, object_metadata, schedule, for_disk_azure_blob_storage, &Poco::Logger::get("copyDataToAzureBlobStorageFile")}; + UploadHelper helper{create_read_buffer, dest_client, offset, size, dest_container, dest_blob, settings, object_metadata, schedule, for_disk_azure_blob_storage, &Poco::Logger::get("copyDataToAzureBlobStorageFile")}; helper.performCopy(); } @@ -345,12 +345,12 @@ void copyDataToAzureBlobStorageFile( void copyAzureBlobStorageFile( std::shared_ptr src_client, std::shared_ptr dest_client, - const String & src_bucket, - const String & src_key, + const String & src_container, + const String & src_blob, size_t offset, size_t size, - const String & dest_bucket, - const String & dest_key, + const String & dest_container, + const String & dest_blob, std::shared_ptr settings, const ReadSettings & read_settings, const std::optional> & object_metadata, @@ -363,21 +363,21 @@ void copyAzureBlobStorageFile( ProfileEvents::increment(ProfileEvents::AzureCopyObject); if (for_disk_azure_blob_storage) ProfileEvents::increment(ProfileEvents::DiskAzureCopyObject); - auto block_blob_client_src = src_client->GetBlockBlobClient(src_key); - auto block_blob_client_dest = dest_client->GetBlockBlobClient(dest_key); + auto block_blob_client_src = src_client->GetBlockBlobClient(src_blob); + auto block_blob_client_dest = dest_client->GetBlockBlobClient(dest_blob); auto uri = block_blob_client_src.GetUrl(); block_blob_client_dest.CopyFromUri(uri); } else { - LOG_TRACE(&Poco::Logger::get("copyAzureBlobStorageFile"), "Reading from Bucket: {}, Key: {}", src_bucket, src_key); + LOG_TRACE(&Poco::Logger::get("copyAzureBlobStorageFile"), "Reading from Container: {}, Blob: {}", src_container, src_blob); auto create_read_buffer = [&] { - return std::make_unique(src_client, src_key, read_settings, settings->max_single_read_retries, + return std::make_unique(src_client, src_blob, read_settings, settings->max_single_read_retries, settings->max_single_download_retries); }; - UploadHelper helper{create_read_buffer, dest_client, offset, size, dest_bucket, dest_key, settings, object_metadata, schedule, for_disk_azure_blob_storage, &Poco::Logger::get("copyAzureBlobStorageFile")}; + UploadHelper helper{create_read_buffer, dest_client, offset, size, dest_container, dest_blob, settings, object_metadata, schedule, for_disk_azure_blob_storage, &Poco::Logger::get("copyAzureBlobStorageFile")}; helper.performCopy(); } } diff --git a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h 
b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h index 31228fbcb23..059d0318f57 100644 --- a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h +++ b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h @@ -23,12 +23,12 @@ using CreateReadBuffer = std::function()>; void copyAzureBlobStorageFile( std::shared_ptr src_client, std::shared_ptr dest_client, - const String & src_bucket, - const String & src_key, + const String & src_container, + const String & src_path, size_t src_offset, size_t src_size, - const String & dest_bucket, - const String & dest_key, + const String & dest_container, + const String & dest_path, std::shared_ptr settings, const ReadSettings & read_settings, const std::optional> & object_metadata = std::nullopt, @@ -46,8 +46,8 @@ void copyDataToAzureBlobStorageFile( size_t offset, size_t size, std::shared_ptr & client, + const String & dest_container, const String & dest_bucket, - const String & dest_key, std::shared_ptr settings, const std::optional> & object_metadata = std::nullopt, ThreadPoolCallbackRunner schedule_ = {}, From 91bad5bc39963e9450f284dfc6b45fd69fa146de Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Thu, 4 Jan 2024 16:06:36 +0100 Subject: [PATCH 0096/1081] Updated to use MultiVersion for BlobContainerClient in Backups and updated to get client from disk --- src/Backups/BackupIO_AzureBlobStorage.cpp | 72 +++++-------------- src/Backups/BackupIO_AzureBlobStorage.h | 4 +- .../AzureBlobStorage/AzureObjectStorage.h | 5 ++ .../copyAzureBlobStorageFile.cpp | 20 +++--- .../copyAzureBlobStorageFile.h | 6 +- 5 files changed, 37 insertions(+), 70 deletions(-) diff --git a/src/Backups/BackupIO_AzureBlobStorage.cpp b/src/Backups/BackupIO_AzureBlobStorage.cpp index de40fc6b33b..968a60c566f 100644 --- a/src/Backups/BackupIO_AzureBlobStorage.cpp +++ b/src/Backups/BackupIO_AzureBlobStorage.cpp @@ -27,8 +27,6 @@ namespace ErrorCodes extern const int LOGICAL_ERROR; } -//using AzureClientPtr = std::shared_ptr; - BackupReaderAzureBlobStorage::BackupReaderAzureBlobStorage( StorageAzureBlob::Configuration configuration_, const ReadSettings & read_settings_, @@ -38,12 +36,13 @@ BackupReaderAzureBlobStorage::BackupReaderAzureBlobStorage( , data_source_description{DataSourceType::AzureBlobStorage, configuration_.container, false, false} , configuration(configuration_) { - client = StorageAzureBlob::createClient(configuration, /* is_read_only */ false); + auto client_ptr = StorageAzureBlob::createClient(configuration, /* is_read_only */ false); settings = StorageAzureBlob::createSettingsAsSharedPtr(context_); auto settings_as_unique_ptr = StorageAzureBlob::createSettings(context_); object_storage = std::make_unique("BackupReaderAzureBlobStorage", - std::make_unique(*client.get()), + std::move(client_ptr), std::move(settings_as_unique_ptr)); + client = object_storage->getClient(); } BackupReaderAzureBlobStorage::~BackupReaderAzureBlobStorage() = default; @@ -89,7 +88,7 @@ std::unique_ptr BackupReaderAzureBlobStorage::readFile(const key = file_name; } return std::make_unique( - client, key, read_settings, settings->max_single_read_retries, + client.get(), key, read_settings, settings->max_single_read_retries, settings->max_single_download_retries); } @@ -113,23 +112,9 @@ void BackupReaderAzureBlobStorage::copyFileToDisk(const String & path_in_backup, "Blob writing function called with unexpected blob_path.size={} or mode={}", blob_path.size(), mode); - std::shared_ptr dest_client; - if (configuration.container == blob_path[1]) - { - dest_client = client; - } - else - { - 
StorageAzureBlob::Configuration dest_configuration = configuration; - dest_configuration.container = blob_path[1]; - dest_configuration.blob_path = blob_path[0]; - dest_client = StorageAzureBlob::createClient(dest_configuration, /* is_read_only */ false); - } - - copyAzureBlobStorageFile( client, - dest_client, + reinterpret_cast(destination_disk->getObjectStorage().get())->getClient(), configuration.container, fs::path(configuration.blob_path) / path_in_backup, 0, @@ -163,12 +148,13 @@ BackupWriterAzureBlobStorage::BackupWriterAzureBlobStorage( , data_source_description{DataSourceType::AzureBlobStorage,configuration_.container, false, false} , configuration(configuration_) { - client = StorageAzureBlob::createClient(configuration, /* is_read_only */ false); + auto client_ptr = StorageAzureBlob::createClient(configuration, /* is_read_only */ false); settings = StorageAzureBlob::createSettingsAsSharedPtr(context_); auto settings_as_unique_ptr = StorageAzureBlob::createSettings(context_); object_storage = std::make_unique("BackupWriterAzureBlobStorage", - std::make_unique(*client.get()), - std::move(settings_as_unique_ptr)); + std::move(client_ptr), + std::move(settings_as_unique_ptr)); + client = object_storage->getClient(); } void BackupWriterAzureBlobStorage::copyFileFromDisk(const String & path_in_backup, DiskPtr src_disk, const String & src_path, @@ -182,23 +168,9 @@ void BackupWriterAzureBlobStorage::copyFileFromDisk(const String & path_in_backu /// In this case we can't use the native copy. if (auto blob_path = src_disk->getBlobPath(src_path); blob_path.size() == 2) { - - std::shared_ptr src_client; - if (configuration.container == blob_path[1]) - { - src_client = client; - } - else - { - StorageAzureBlob::Configuration src_configuration = configuration; - src_configuration.container = blob_path[1]; - src_configuration.blob_path = blob_path[0]; - src_client = StorageAzureBlob::createClient(src_configuration, /* is_read_only */ false); - } - LOG_TRACE(log, "Copying file {} from disk {} to AzureBlobStorag", src_path, src_disk->getName()); copyAzureBlobStorageFile( - src_client, + reinterpret_cast(src_disk->getObjectStorage().get())->getClient(), client, /* src_container */ blob_path[1], /* src_path */ blob_path[0], @@ -220,26 +192,16 @@ void BackupWriterAzureBlobStorage::copyFileFromDisk(const String & path_in_backu void BackupWriterAzureBlobStorage::copyFile(const String & destination, const String & source, size_t size) { - std::shared_ptr src_client; - std::shared_ptr dest_client; - StorageAzureBlob::Configuration src_configuration = configuration; - src_configuration.container = source; - src_client = StorageAzureBlob::createClient(src_configuration, /* is_read_only */ false); - - StorageAzureBlob::Configuration dest_configuration = configuration; - dest_configuration.container = destination; - dest_client = StorageAzureBlob::createClient(dest_configuration, /* is_read_only */ false); - LOG_TRACE(log, "Copying file inside backup from {} to {} ", source, destination); copyAzureBlobStorageFile( - src_client, - dest_client, + client, + client, configuration.container, - fs::path(configuration.blob_path), + fs::path(source), 0, size, - /* dest_container */ destination, - /* dest_path */ configuration.blob_path, + /* dest_container */ configuration.container, + /* dest_path */ destination, settings, read_settings, {}, @@ -303,7 +265,7 @@ std::unique_ptr BackupWriterAzureBlobStorage::readFile(const String } return std::make_unique( - client, key, read_settings, 
settings->max_single_read_retries, + client.get(), key, read_settings, settings->max_single_read_retries, settings->max_single_download_retries); } @@ -319,7 +281,7 @@ std::unique_ptr BackupWriterAzureBlobStorage::writeFile(const Strin key = file_name; } return std::make_unique( - client, + client.get(), key, settings->max_single_part_upload_size, DBMS_DEFAULT_BUFFER_SIZE, diff --git a/src/Backups/BackupIO_AzureBlobStorage.h b/src/Backups/BackupIO_AzureBlobStorage.h index 87a6c3ef675..12bf073cd08 100644 --- a/src/Backups/BackupIO_AzureBlobStorage.h +++ b/src/Backups/BackupIO_AzureBlobStorage.h @@ -28,7 +28,7 @@ public: private: const DataSourceDescription data_source_description; - std::shared_ptr client; + MultiVersion client; StorageAzureBlob::Configuration configuration; std::unique_ptr object_storage; std::shared_ptr settings; @@ -57,7 +57,7 @@ private: std::unique_ptr readFile(const String & file_name, size_t expected_file_size) override; void removeFilesBatch(const Strings & file_names); const DataSourceDescription data_source_description; - std::shared_ptr client; + MultiVersion client; StorageAzureBlob::Configuration configuration; std::unique_ptr object_storage; std::shared_ptr settings; diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h index 55c81b4b7d9..1ff4537742f 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h @@ -134,6 +134,11 @@ public: bool isRemote() const override { return true; } + MultiVersion & getClient() + { + return client; + } + private: const String name; /// client used to access the files in the Blob Storage cloud diff --git a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp index df1341efdd1..4ec90d2830e 100644 --- a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp +++ b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp @@ -43,7 +43,7 @@ namespace public: UploadHelper( const CreateReadBuffer & create_read_buffer_, - std::shared_ptr client_, + MultiVersion & client_, size_t offset_, size_t total_size_, const String & dest_container_, @@ -72,7 +72,7 @@ namespace protected: std::function()> create_read_buffer; - std::shared_ptr client; + MultiVersion & client; size_t offset; size_t total_size; const String & dest_container; @@ -170,7 +170,7 @@ namespace void completeMultipartUpload() { - auto block_blob_client = client->GetBlockBlobClient(dest_blob); + auto block_blob_client = client.get()->GetBlockBlobClient(dest_blob); block_blob_client.CommitBlockList(block_ids); } @@ -295,7 +295,7 @@ namespace if (for_disk_azure_blob_storage) ProfileEvents::increment(ProfileEvents::DiskAzureUploadPart); - auto block_blob_client = client->GetBlockBlobClient(dest_blob); + auto block_blob_client = client.get()->GetBlockBlobClient(dest_blob); task.block_id = getRandomASCIIString(64); Azure::Core::IO::MemoryBodyStream memory(reinterpret_cast(task.data), task.size); block_blob_client.StageBlock(task.block_id, memory); @@ -329,7 +329,7 @@ void copyDataToAzureBlobStorageFile( const std::function()> & create_read_buffer, size_t offset, size_t size, - std::shared_ptr & dest_client, + MultiVersion & dest_client, const String & dest_container, const String & dest_blob, std::shared_ptr settings, @@ -343,8 +343,8 @@ void copyDataToAzureBlobStorageFile( void copyAzureBlobStorageFile( - std::shared_ptr src_client, - std::shared_ptr 
dest_client, + MultiVersion & src_client, + MultiVersion & dest_client, const String & src_container, const String & src_blob, size_t offset, @@ -363,8 +363,8 @@ void copyAzureBlobStorageFile( ProfileEvents::increment(ProfileEvents::AzureCopyObject); if (for_disk_azure_blob_storage) ProfileEvents::increment(ProfileEvents::DiskAzureCopyObject); - auto block_blob_client_src = src_client->GetBlockBlobClient(src_blob); - auto block_blob_client_dest = dest_client->GetBlockBlobClient(dest_blob); + auto block_blob_client_src = src_client.get()->GetBlockBlobClient(src_blob); + auto block_blob_client_dest = dest_client.get()->GetBlockBlobClient(dest_blob); auto uri = block_blob_client_src.GetUrl(); block_blob_client_dest.CopyFromUri(uri); } @@ -373,7 +373,7 @@ void copyAzureBlobStorageFile( LOG_TRACE(&Poco::Logger::get("copyAzureBlobStorageFile"), "Reading from Container: {}, Blob: {}", src_container, src_blob); auto create_read_buffer = [&] { - return std::make_unique(src_client, src_blob, read_settings, settings->max_single_read_retries, + return std::make_unique(src_client.get(), src_blob, read_settings, settings->max_single_read_retries, settings->max_single_download_retries); }; diff --git a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h index 059d0318f57..a6502541db1 100644 --- a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h +++ b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h @@ -21,8 +21,8 @@ using CreateReadBuffer = std::function()>; /// Copies a file from AzureBlobStorage to AzureBlobStorage. /// The parameters `src_offset` and `src_size` specify a part in the source to copy. void copyAzureBlobStorageFile( - std::shared_ptr src_client, - std::shared_ptr dest_client, + MultiVersion & src_client, + MultiVersion & dest_client, const String & src_container, const String & src_path, size_t src_offset, @@ -45,7 +45,7 @@ void copyDataToAzureBlobStorageFile( const std::function()> & create_read_buffer, size_t offset, size_t size, - std::shared_ptr & client, + MultiVersion & client, const String & dest_container, const String & dest_bucket, std::shared_ptr settings, From c14605caa7f403531a6ff0663c242aa5d466ab07 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Thu, 4 Jan 2024 18:27:54 +0100 Subject: [PATCH 0097/1081] Added flag use_native_copy and updated to use StartCopyFromUri for native copy with large files --- .../AzureBlobStorage/AzureBlobStorageAuth.cpp | 3 ++- .../AzureBlobStorage/AzureObjectStorage.h | 10 +++---- .../copyAzureBlobStorageFile.cpp | 26 ++++++++++++++++--- 3 files changed, 30 insertions(+), 9 deletions(-) diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp b/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp index 9e703d6fc5e..e29def06363 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp @@ -167,7 +167,8 @@ std::unique_ptr getAzureBlobStorageSettings(const Po config.getInt(config_prefix + ".list_object_keys_size", 1000), config.getUInt64(config_prefix + ".min_upload_part_size", 16 * 1024 * 1024), config.getUInt64(config_prefix + ".max_upload_part_size", 5ULL * 1024 * 1024 * 1024), - config.getUInt64(config_prefix + ".max_part_number", 10000) + config.getUInt64(config_prefix + ".max_part_number", 10000), + config.getBool(config_prefix + ".use_native_copy", false) ); } diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h 
b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h index 1ff4537742f..436b48c0ad4 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h @@ -27,7 +27,8 @@ struct AzureObjectStorageSettings int list_object_keys_size_, size_t min_upload_part_size_, size_t max_upload_part_size_, - size_t max_part_number_) + size_t max_part_number_, + bool use_native_copy_) : max_single_part_upload_size(max_single_part_upload_size_) , min_bytes_for_seek(min_bytes_for_seek_) , max_single_read_retries(max_single_read_retries_) @@ -36,6 +37,7 @@ struct AzureObjectStorageSettings , min_upload_part_size(min_upload_part_size_) , max_upload_part_size(max_upload_part_size_) , max_part_number(max_part_number_) + , use_native_copy(use_native_copy_) { } @@ -49,6 +51,7 @@ struct AzureObjectStorageSettings size_t min_upload_part_size = 16 * 1024 * 1024; size_t max_upload_part_size = 5ULL * 1024 * 1024 * 1024; size_t max_part_number = 10000; + bool use_native_copy = false; }; using AzureClient = Azure::Storage::Blobs::BlobContainerClient; @@ -134,10 +137,7 @@ public: bool isRemote() const override { return true; } - MultiVersion & getClient() - { - return client; - } + MultiVersion & getClient() { return client; } private: const String name; diff --git a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp index 4ec90d2830e..9db5ddb476a 100644 --- a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp +++ b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp @@ -30,6 +30,7 @@ namespace ErrorCodes { extern const int LOGICAL_ERROR; extern const int INVALID_CONFIG_PARAMETER; + extern const int AZURE_BLOB_STORAGE_ERROR; } @@ -358,15 +359,34 @@ void copyAzureBlobStorageFile( bool for_disk_azure_blob_storage) { - if (size < max_single_operation_copy_size) + if (settings->use_native_copy ) { ProfileEvents::increment(ProfileEvents::AzureCopyObject); if (for_disk_azure_blob_storage) ProfileEvents::increment(ProfileEvents::DiskAzureCopyObject); + auto block_blob_client_src = src_client.get()->GetBlockBlobClient(src_blob); auto block_blob_client_dest = dest_client.get()->GetBlockBlobClient(dest_blob); - auto uri = block_blob_client_src.GetUrl(); - block_blob_client_dest.CopyFromUri(uri); + auto source_uri = block_blob_client_src.GetUrl(); + + if (size < max_single_operation_copy_size) + { + block_blob_client_dest.CopyFromUri(source_uri); + } + else + { + Azure::Storage::Blobs::StartBlobCopyOperation operation = block_blob_client_dest.StartCopyFromUri(source_uri); + + // Wait for the operation to finish, checking the status every 100 milliseconds.
+ auto copy_response = operation.PollUntilDone(std::chrono::milliseconds(100)); + auto properties_model = copy_response.Value; + + if (properties_model.CopySource.HasValue()) + { + throw Exception(ErrorCodes::AZURE_BLOB_STORAGE_ERROR, "Copy failed"); + } + + } } else { From 2ee68933123583fe585093868e65c3562d36d66a Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Fri, 5 Jan 2024 10:58:04 +0100 Subject: [PATCH 0098/1081] Updated to return container for getObjectsNamespace --- src/Backups/BackupIO_AzureBlobStorage.cpp | 6 ++++-- .../ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp | 7 +++++-- .../ObjectStorages/AzureBlobStorage/AzureObjectStorage.h | 6 ++++-- .../AzureBlobStorage/registerDiskAzureBlobStorage.cpp | 4 +++- src/Storages/StorageAzureBlob.cpp | 2 +- src/TableFunctions/TableFunctionAzureBlobStorage.cpp | 4 ++-- .../TableFunctionAzureBlobStorageCluster.cpp | 4 ++-- 7 files changed, 21 insertions(+), 12 deletions(-) diff --git a/src/Backups/BackupIO_AzureBlobStorage.cpp b/src/Backups/BackupIO_AzureBlobStorage.cpp index 968a60c566f..5ddbb42e2c0 100644 --- a/src/Backups/BackupIO_AzureBlobStorage.cpp +++ b/src/Backups/BackupIO_AzureBlobStorage.cpp @@ -41,7 +41,8 @@ BackupReaderAzureBlobStorage::BackupReaderAzureBlobStorage( auto settings_as_unique_ptr = StorageAzureBlob::createSettings(context_); object_storage = std::make_unique("BackupReaderAzureBlobStorage", std::move(client_ptr), - std::move(settings_as_unique_ptr)); + std::move(settings_as_unique_ptr), + configuration_.container); client = object_storage->getClient(); } @@ -153,7 +154,8 @@ BackupWriterAzureBlobStorage::BackupWriterAzureBlobStorage( auto settings_as_unique_ptr = StorageAzureBlob::createSettings(context_); object_storage = std::make_unique("BackupWriterAzureBlobStorage", std::move(client_ptr), - std::move(settings_as_unique_ptr)); + std::move(settings_as_unique_ptr), + configuration_.container); client = object_storage->getClient(); } diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp index 068e2aebab1..1f92ef48350 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp @@ -92,10 +92,12 @@ private: AzureObjectStorage::AzureObjectStorage( const String & name_, AzureClientPtr && client_, - SettingsPtr && settings_) + SettingsPtr && settings_, + const String & container_) : name(name_) , client(std::move(client_)) , settings(std::move(settings_)) + , container(container_) , log(&Poco::Logger::get("AzureObjectStorage")) { data_source_description.type = DataSourceType::AzureBlobStorage; @@ -379,7 +381,8 @@ std::unique_ptr AzureObjectStorage::cloneObjectStorage(const std return std::make_unique( name, getAzureBlobContainerClient(config, config_prefix), - getAzureBlobStorageSettings(config, config_prefix, context) + getAzureBlobStorageSettings(config, config_prefix, context), + container ); } diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h index 436b48c0ad4..660d4a30889 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h @@ -66,7 +66,8 @@ public: AzureObjectStorage( const String & name_, AzureClientPtr && client_, - SettingsPtr && settings_); + SettingsPtr && settings_, + const String & container_); void listObjects(const std::string & path, 
RelativePathsWithMetadata & children, int max_keys) const override; @@ -125,7 +126,7 @@ public: const std::string & config_prefix, ContextPtr context) override; - String getObjectsNamespace() const override { return ""; } + String getObjectsNamespace() const override { return container ; } std::unique_ptr cloneObjectStorage( const std::string & new_namespace, @@ -144,6 +145,7 @@ private: /// client used to access the files in the Blob Storage cloud MultiVersion client; MultiVersion settings; + const String container; Poco::Logger * log; diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/registerDiskAzureBlobStorage.cpp b/src/Disks/ObjectStorages/AzureBlobStorage/registerDiskAzureBlobStorage.cpp index 7ba9d21db62..2ffd910f92a 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/registerDiskAzureBlobStorage.cpp +++ b/src/Disks/ObjectStorages/AzureBlobStorage/registerDiskAzureBlobStorage.cpp @@ -26,10 +26,12 @@ void registerDiskAzureBlobStorage(DiskFactory & factory, bool global_skip_access { auto [metadata_path, metadata_disk] = prepareForLocalMetadata(name, config, config_prefix, context); + String container_name = config.getString(config_prefix + ".container_name", "default-container"); ObjectStoragePtr azure_object_storage = std::make_unique( name, getAzureBlobContainerClient(config, config_prefix), - getAzureBlobStorageSettings(config, config_prefix, context)); + getAzureBlobStorageSettings(config, config_prefix, context), + container_name); String key_prefix; auto metadata_storage = std::make_shared(metadata_disk, key_prefix); diff --git a/src/Storages/StorageAzureBlob.cpp b/src/Storages/StorageAzureBlob.cpp index f1070c8c31e..fcd7074b9d2 100644 --- a/src/Storages/StorageAzureBlob.cpp +++ b/src/Storages/StorageAzureBlob.cpp @@ -314,7 +314,7 @@ void registerStorageAzureBlob(StorageFactory & factory) return std::make_shared( std::move(configuration), - std::make_unique("AzureBlobStorage", std::move(client), std::move(settings)), + std::make_unique("AzureBlobStorage", std::move(client), std::move(settings),configuration.container), args.getContext(), args.table_id, args.columns, diff --git a/src/TableFunctions/TableFunctionAzureBlobStorage.cpp b/src/TableFunctions/TableFunctionAzureBlobStorage.cpp index d394c836369..b098cac5144 100644 --- a/src/TableFunctions/TableFunctionAzureBlobStorage.cpp +++ b/src/TableFunctions/TableFunctionAzureBlobStorage.cpp @@ -262,7 +262,7 @@ ColumnsDescription TableFunctionAzureBlobStorage::getActualTableStructure(Contex auto client = StorageAzureBlob::createClient(configuration, !is_insert_query); auto settings = StorageAzureBlob::createSettings(context); - auto object_storage = std::make_unique("AzureBlobStorageTableFunction", std::move(client), std::move(settings)); + auto object_storage = std::make_unique("AzureBlobStorageTableFunction", std::move(client), std::move(settings), configuration.container); return StorageAzureBlob::getTableStructureFromData(object_storage.get(), configuration, std::nullopt, context, false); } @@ -293,7 +293,7 @@ StoragePtr TableFunctionAzureBlobStorage::executeImpl(const ASTPtr & /*ast_funct StoragePtr storage = std::make_shared( configuration, - std::make_unique(table_name, std::move(client), std::move(settings)), + std::make_unique(table_name, std::move(client), std::move(settings), configuration.container), context, StorageID(getDatabaseName(), table_name), columns, diff --git a/src/TableFunctions/TableFunctionAzureBlobStorageCluster.cpp b/src/TableFunctions/TableFunctionAzureBlobStorageCluster.cpp index 
eee585967c2..1c3b302a186 100644 --- a/src/TableFunctions/TableFunctionAzureBlobStorageCluster.cpp +++ b/src/TableFunctions/TableFunctionAzureBlobStorageCluster.cpp @@ -40,7 +40,7 @@ StoragePtr TableFunctionAzureBlobStorageCluster::executeImpl( /// On worker node this filename won't contains globs storage = std::make_shared( configuration, - std::make_unique(table_name, std::move(client), std::move(settings)), + std::make_unique(table_name, std::move(client), std::move(settings), configuration.container), context, StorageID(getDatabaseName(), table_name), columns, @@ -55,7 +55,7 @@ StoragePtr TableFunctionAzureBlobStorageCluster::executeImpl( storage = std::make_shared( cluster_name, configuration, - std::make_unique(table_name, std::move(client), std::move(settings)), + std::make_unique(table_name, std::move(client), std::move(settings), configuration.container), StorageID(getDatabaseName(), table_name), columns, ConstraintsDescription{}, From b250acff789620be57e21977d8f3d4a3468070d5 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Fri, 5 Jan 2024 11:26:32 +0100 Subject: [PATCH 0099/1081] Fixed style check --- src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp index 9db5ddb476a..3399f1705f4 100644 --- a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp +++ b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp @@ -359,7 +359,7 @@ void copyAzureBlobStorageFile( bool for_disk_azure_blob_storage) { - if (settings->use_native_copy ) + if (settings->use_native_copy) { ProfileEvents::increment(ProfileEvents::AzureCopyObject); if (for_disk_azure_blob_storage) From 356fc0aadb8f7c0f15f72c3b72955e1db7046e48 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Sun, 7 Jan 2024 14:49:24 +0100 Subject: [PATCH 0100/1081] Fix tests --- src/Storages/StorageView.cpp | 8 +++++++- 1 file changed, 7 insertions(+), 1 deletion(-) diff --git a/src/Storages/StorageView.cpp b/src/Storages/StorageView.cpp index 2f7267e3701..1898e49de86 100644 --- a/src/Storages/StorageView.cpp +++ b/src/Storages/StorageView.cpp @@ -112,8 +112,14 @@ StorageView::StorageView( : IStorage(table_id_) { StorageInMemoryMetadata storage_metadata; - if (is_parameterized_view_ && !query.isParameterizedView()) + if (is_parameterized_view_) + { + if (!query.isParameterizedView()) + storage_metadata.setColumns(columns_); + } + else storage_metadata.setColumns(columns_); + storage_metadata.setComment(comment); if (!query.select) From fd92c1961e5f09411d83b21c4fe9f00b78be22ba Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Sun, 7 Jan 2024 16:33:48 +0100 Subject: [PATCH 0101/1081] Fix clang tidy build --- src/Backups/BackupIO_AzureBlobStorage.cpp | 12 ++++++------ src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp | 10 +++++----- src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h | 6 +++--- 3 files changed, 14 insertions(+), 14 deletions(-) diff --git a/src/Backups/BackupIO_AzureBlobStorage.cpp b/src/Backups/BackupIO_AzureBlobStorage.cpp index 5ddbb42e2c0..8c6c1040eec 100644 --- a/src/Backups/BackupIO_AzureBlobStorage.cpp +++ b/src/Backups/BackupIO_AzureBlobStorage.cpp @@ -305,21 +305,21 @@ void BackupWriterAzureBlobStorage::removeFile(const String & file_name) object_storage->removeObjectIfExists(object); } -void BackupWriterAzureBlobStorage::removeFiles(const Strings & keys) +void BackupWriterAzureBlobStorage::removeFiles(const Strings & file_names) { 
StoredObjects objects; - for (const auto & key : keys) - objects.emplace_back(key); + for (const auto & file_name : file_names) + objects.emplace_back(file_name); object_storage->removeObjectsIfExist(objects); } -void BackupWriterAzureBlobStorage::removeFilesBatch(const Strings & keys) +void BackupWriterAzureBlobStorage::removeFilesBatch(const Strings & file_names) { StoredObjects objects; - for (const auto & key : keys) - objects.emplace_back(key); + for (const auto & file_name : file_names) + objects.emplace_back(file_name); object_storage->removeObjectsIfExist(objects); } diff --git a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp index 3399f1705f4..272be914cc1 100644 --- a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp +++ b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp @@ -65,11 +65,11 @@ namespace , schedule(schedule_) , for_disk_azure_blob_storage(for_disk_azure_blob_storage_) , log(log_) - , max_single_part_upload_size(settings_.get()->max_single_part_upload_size) + , max_single_part_upload_size(settings_->max_single_part_upload_size) { } - ~UploadHelper() {} + virtual ~UploadHelper() = default; protected: std::function()> create_read_buffer; @@ -114,9 +114,9 @@ namespace if (!total_size) throw Exception(ErrorCodes::LOGICAL_ERROR, "Chosen multipart upload for an empty file. This must not happen"); - auto max_part_number = settings.get()->max_part_number; - auto min_upload_part_size = settings.get()->min_upload_part_size; - auto max_upload_part_size = settings.get()->max_upload_part_size; + auto max_part_number = settings->max_part_number; + auto min_upload_part_size = settings->min_upload_part_size; + auto max_upload_part_size = settings->max_upload_part_size; if (!max_part_number) throw Exception(ErrorCodes::INVALID_CONFIG_PARAMETER, "max_part_number must not be 0"); diff --git a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h index a6502541db1..b022151d32d 100644 --- a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h +++ b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h @@ -24,11 +24,11 @@ void copyAzureBlobStorageFile( MultiVersion & src_client, MultiVersion & dest_client, const String & src_container, - const String & src_path, + const String & src_blob, size_t src_offset, size_t src_size, const String & dest_container, - const String & dest_path, + const String & dest_blob, std::shared_ptr settings, const ReadSettings & read_settings, const std::optional> & object_metadata = std::nullopt, @@ -47,7 +47,7 @@ void copyDataToAzureBlobStorageFile( size_t size, MultiVersion & client, const String & dest_container, - const String & dest_bucket, + const String & dest_blob, std::shared_ptr settings, const std::optional> & object_metadata = std::nullopt, ThreadPoolCallbackRunner schedule_ = {}, From f50f7f56949021d01ba692f6788e50d411ca8af9 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Mon, 8 Jan 2024 14:25:33 +0100 Subject: [PATCH 0102/1081] Removed unwanted includes --- .../registerBackupEngineAzureBlobStorage.cpp | 19 ------------------- 1 file changed, 19 deletions(-) diff --git a/src/Backups/registerBackupEngineAzureBlobStorage.cpp b/src/Backups/registerBackupEngineAzureBlobStorage.cpp index ef95206831f..810da5adb3f 100644 --- a/src/Backups/registerBackupEngineAzureBlobStorage.cpp +++ b/src/Backups/registerBackupEngineAzureBlobStorage.cpp @@ -10,13 +10,11 @@ #include #include #include -#include #endif namespace DB { -namespace fs = 
std::filesystem; namespace ErrorCodes { @@ -25,23 +23,6 @@ namespace ErrorCodes extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; } -#if USE_AZURE_BLOB_STORAGE -namespace -{ - String removeFileNameFromURL(String & url) - { - Poco::URI url2{url}; - String path = url2.getPath(); - size_t slash_pos = path.find_last_of('/'); - String file_name = path.substr(slash_pos + 1); - path.resize(slash_pos + 1); - url2.setPath(path); - url = url2.toString(); - return file_name; - } -} -#endif - void registerBackupEngineAzureBlobStorage(BackupFactory & factory) { From 2d914721e5101215c2c63c97151552cb7c8ff746 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Mon, 8 Jan 2024 15:10:37 +0100 Subject: [PATCH 0103/1081] Fix build --- .../registerBackupEngineAzureBlobStorage.cpp | 17 +++++++++++++++++ 1 file changed, 17 insertions(+) diff --git a/src/Backups/registerBackupEngineAzureBlobStorage.cpp b/src/Backups/registerBackupEngineAzureBlobStorage.cpp index 810da5adb3f..3480ea75f1f 100644 --- a/src/Backups/registerBackupEngineAzureBlobStorage.cpp +++ b/src/Backups/registerBackupEngineAzureBlobStorage.cpp @@ -10,6 +10,7 @@ #include #include #include +#include #endif @@ -23,6 +24,22 @@ namespace ErrorCodes extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; } +#if USE_AZURE_BLOB_STORAGE +namespace +{ + String removeFileNameFromURL(String & url) + { + Poco::URI url2{url}; + String path = url2.getPath(); + size_t slash_pos = path.find_last_of('/'); + String file_name = path.substr(slash_pos + 1); + path.resize(slash_pos + 1); + url2.setPath(path); + url = url2.toString(); + return file_name; + } +} +#endif void registerBackupEngineAzureBlobStorage(BackupFactory & factory) { From 3de5b27c48483962285de0b16f152cc35eadd1a6 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Mon, 8 Jan 2024 16:50:17 +0100 Subject: [PATCH 0104/1081] Fix conflicts --- .../Serializations/SerializationString.cpp | 22 ++++++++++++++++++- 1 file changed, 21 insertions(+), 1 deletion(-) diff --git a/src/DataTypes/Serializations/SerializationString.cpp b/src/DataTypes/Serializations/SerializationString.cpp index a6bf29336b7..b2c254e63c5 100644 --- a/src/DataTypes/Serializations/SerializationString.cpp +++ b/src/DataTypes/Serializations/SerializationString.cpp @@ -381,7 +381,7 @@ void SerializationString::deserializeTextJSON(IColumn & column, ReadBuffer & ist str_value = "false"; } - read(column, [&](ColumnString::Chars & data) { data.insert(str_value.begin(), str_value.end()); }); + read(column, [&](ColumnString::Chars & data) { data.insert(str_value.begin(), str_value.end()); }); } else if (settings.json.read_numbers_as_strings && !istr.eof() && *istr.position() != '"') { @@ -406,6 +406,26 @@ bool SerializationString::tryDeserializeTextJSON(IColumn & column, ReadBuffer & if (settings.json.read_arrays_as_strings && !istr.eof() && *istr.position() == '[') return read(column, [&](ColumnString::Chars & data) { return readJSONArrayInto(data, istr); }); + if (settings.json.read_bools_as_strings && !istr.eof() && (*istr.position() == 't' || *istr.position() == 'f')) + { + String str_value; + if (*istr.position() == 't') + { + if (!checkString("true", istr)) + return false; + str_value = "true"; + } + else if (*istr.position() == 'f') + { + if (!checkString("false", istr)) + return false; + str_value = "false"; + } + + read(column, [&](ColumnString::Chars & data) { data.insert(str_value.begin(), str_value.end()); }); + return true; + } + if (settings.json.read_numbers_as_strings && !istr.eof() && 
*istr.position() != '"') { String field; From c5bf722ee2d2b50d1b0691112b769e3e67612214 Mon Sep 17 00:00:00 2001 From: Azat Khuzhin Date: Mon, 8 Jan 2024 21:24:44 +0300 Subject: [PATCH 0105/1081] Create ch/chc/chl symlinks by cmake as well (for develop mode) Before, they had been created only by install target. Follow-up for: #56634 Signed-off-by: Azat Khuzhin --- programs/CMakeLists.txt | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/programs/CMakeLists.txt b/programs/CMakeLists.txt index b3a5af6d6c9..6e544bac81c 100644 --- a/programs/CMakeLists.txt +++ b/programs/CMakeLists.txt @@ -328,6 +328,10 @@ set (CLICKHOUSE_BUNDLE) if (ENABLE_CLICKHOUSE_SELF_EXTRACTING) list(APPEND CLICKHOUSE_BUNDLE self-extracting) endif () + +if (NOT BUILD_STANDALONE_KEEPER) + add_custom_target (ch ALL COMMAND ${CMAKE_COMMAND} -E create_symlink clickhouse ch DEPENDS clickhouse) +endif() if (ENABLE_CLICKHOUSE_SERVER) add_custom_target (clickhouse-server ALL COMMAND ${CMAKE_COMMAND} -E create_symlink clickhouse clickhouse-server DEPENDS clickhouse) install (FILES "${CMAKE_CURRENT_BINARY_DIR}/clickhouse-server" DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse) @@ -335,11 +339,13 @@ if (ENABLE_CLICKHOUSE_SERVER) endif () if (ENABLE_CLICKHOUSE_CLIENT) add_custom_target (clickhouse-client ALL COMMAND ${CMAKE_COMMAND} -E create_symlink clickhouse clickhouse-client DEPENDS clickhouse) + add_custom_target (chc ALL COMMAND ${CMAKE_COMMAND} -E create_symlink clickhouse chc DEPENDS clickhouse) install (FILES "${CMAKE_CURRENT_BINARY_DIR}/clickhouse-client" DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse) list(APPEND CLICKHOUSE_BUNDLE clickhouse-client) endif () if (ENABLE_CLICKHOUSE_LOCAL) add_custom_target (clickhouse-local ALL COMMAND ${CMAKE_COMMAND} -E create_symlink clickhouse clickhouse-local DEPENDS clickhouse) + add_custom_target (chl ALL COMMAND ${CMAKE_COMMAND} -E create_symlink clickhouse chl DEPENDS clickhouse) install (FILES "${CMAKE_CURRENT_BINARY_DIR}/clickhouse-local" DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse) list(APPEND CLICKHOUSE_BUNDLE clickhouse-local) endif () From 21e4b453dfc7df905ed304c5513b50f57ef19228 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Mon, 8 Jan 2024 22:02:40 +0100 Subject: [PATCH 0106/1081] Fix pretty type name --- src/DataTypes/DataTypeVariant.cpp | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/src/DataTypes/DataTypeVariant.cpp b/src/DataTypes/DataTypeVariant.cpp index 5dc42cc7443..2bc4dfa5a7a 100644 --- a/src/DataTypes/DataTypeVariant.cpp +++ b/src/DataTypes/DataTypeVariant.cpp @@ -71,17 +71,17 @@ std::string DataTypeVariant::doGetPrettyName(size_t indent) const { size_t size = variants.size(); WriteBufferFromOwnString s; - s << "Variant(\n"; + s << "Variant("; for (size_t i = 0; i != size; ++i) { if (i != 0) - s << ",\n"; + s << ", "; - s << fourSpaceIndent(indent + 1) << variants[i]->getPrettyName(indent + 1); + s << variants[i]->getPrettyName(indent); } - s << '\n' << fourSpaceIndent(indent) << ')'; + s << ')'; return s.str(); } From 629d4b921e5cf2d709d2ca7a55658d95407e2ff7 Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Tue, 9 Jan 2024 15:38:04 +0000 Subject: [PATCH 0107/1081] Fix style --- src/Analyzer/Passes/IfConstantConditionPass.cpp | 2 +- src/Storages/StorageMerge.cpp | 1 - 2 files changed, 1 insertion(+), 2 deletions(-) diff --git a/src/Analyzer/Passes/IfConstantConditionPass.cpp b/src/Analyzer/Passes/IfConstantConditionPass.cpp index f3b8b712dbf..6b24eb1d539 
100644 --- a/src/Analyzer/Passes/IfConstantConditionPass.cpp +++ b/src/Analyzer/Passes/IfConstantConditionPass.cpp @@ -57,7 +57,7 @@ public: } -void IfConstantConditionPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) +void IfConstantConditionPass::run(QueryTreeNodePtr & query_tree_node, ContextPtr context) { IfConstantConditionVisitor visitor(std::move(context)); visitor.visit(query_tree_node); diff --git a/src/Storages/StorageMerge.cpp b/src/Storages/StorageMerge.cpp index 15ca6e65482..ffbf98e85c7 100644 --- a/src/Storages/StorageMerge.cpp +++ b/src/Storages/StorageMerge.cpp @@ -92,7 +92,6 @@ namespace ErrorCodes extern const int SAMPLING_NOT_SUPPORTED; extern const int ALTER_OF_COLUMN_IS_FORBIDDEN; extern const int CANNOT_EXTRACT_TABLE_STRUCTURE; - extern const int LOGICAL_ERROR; } StorageMerge::DatabaseNameOrRegexp::DatabaseNameOrRegexp( From 633b4a5dcfcf63bec8e2b5a1b5f38e648348639d Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Tue, 9 Jan 2024 19:23:34 +0100 Subject: [PATCH 0108/1081] Apply suggestions from code review Co-authored-by: Antonio Andelic --- src/Columns/ColumnNullable.cpp | 2 +- src/Columns/ColumnVariant.cpp | 8 +++++--- src/Columns/ColumnVariant.h | 2 +- src/DataTypes/EnumValues.cpp | 4 +--- 4 files changed, 8 insertions(+), 8 deletions(-) diff --git a/src/Columns/ColumnNullable.cpp b/src/Columns/ColumnNullable.cpp index d2a579d6800..25b0e35e15e 100644 --- a/src/Columns/ColumnNullable.cpp +++ b/src/Columns/ColumnNullable.cpp @@ -928,7 +928,7 @@ ColumnPtr makeNullableOrLowCardinalityNullableSafe(const ColumnPtr & column) return assert_cast(*column).cloneNullable(); if (column->canBeInsideNullable()) - return makeNullableSafe(column); + return makeNullable(column); return column; } diff --git a/src/Columns/ColumnVariant.cpp b/src/Columns/ColumnVariant.cpp index f90ebfc54bb..10d79f59d37 100644 --- a/src/Columns/ColumnVariant.cpp +++ b/src/Columns/ColumnVariant.cpp @@ -631,9 +631,9 @@ void ColumnVariant::popBack(size_t n) size_t size = local_discriminators_data.size(); const size_t num_variants = variants.size(); std::vector nested_n(num_variants, 0); - for (size_t i = 0; i != n; ++i) + for (size_t i = size - n; i < size; ++i) { - Discriminator discr = local_discriminators_data[size - i - 1]; + Discriminator discr = local_discriminators_data[i]; if (discr != NULL_DISCRIMINATOR) ++nested_n[discr]; } @@ -966,7 +966,7 @@ ColumnPtr ColumnVariant::replicate(const Offsets & replicate_offsets) const { new_offsets_data.reserve(new_size); for (size_t i = old_size; i < new_size; ++i) - new_offsets_data.push_back(new_offsets_data[i - 1] + 1); + new_offsets_data.push_back(i); } else { @@ -1260,6 +1260,8 @@ std::optional ColumnVariant::getLocalDiscriminator { if (variants[i]->size() == local_discriminators->size()) return i; + if (!variants[i]->empty()) + return std::nullopt } return std::nullopt; diff --git a/src/Columns/ColumnVariant.h b/src/Columns/ColumnVariant.h index eb96205924c..8f0c5a6eef9 100644 --- a/src/Columns/ColumnVariant.h +++ b/src/Columns/ColumnVariant.h @@ -205,7 +205,7 @@ public: void compareColumn(const IColumn &, size_t, PaddedPODArray *, PaddedPODArray &, int, int) const override { - throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method compareColumn is not supported for ColumnAggregateFunction"); + throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method compareColumn is not supported for ColumnVariant"); } bool hasEqualValues() const override; diff --git a/src/DataTypes/EnumValues.cpp 
b/src/DataTypes/EnumValues.cpp index 8a4b1304d5e..a15136b9335 100644 --- a/src/DataTypes/EnumValues.cpp +++ b/src/DataTypes/EnumValues.cpp @@ -85,9 +85,7 @@ bool EnumValues::tryGetValue(T & x, StringRef field_name, bool try_treat_as_i if (try_treat_as_id) { ReadBufferFromMemory tmp_buf(field_name.data, field_name.size); - if (!tryReadText(x, tmp_buf) || !tmp_buf.eof() || !value_to_name_map.contains(x)) - return false; - return true; + return tryReadText(x, tmp_buf) && tmp_buf.eof() && value_to_name_map.contains(x); } return false; } From fb758e48b04c5f799a5169af584f6a562866640d Mon Sep 17 00:00:00 2001 From: avogar Date: Tue, 9 Jan 2024 19:02:20 +0000 Subject: [PATCH 0109/1081] Apply suggestions --- src/Columns/ColumnVariant.cpp | 172 +++++++++++++++------------------- 1 file changed, 74 insertions(+), 98 deletions(-) diff --git a/src/Columns/ColumnVariant.cpp b/src/Columns/ColumnVariant.cpp index 10d79f59d37..a707ec8e153 100644 --- a/src/Columns/ColumnVariant.cpp +++ b/src/Columns/ColumnVariant.cpp @@ -204,10 +204,13 @@ ColumnVariant::ColumnVariant(DB::MutableColumnPtr local_discriminators_, DB::Mut } } -ColumnVariant::Ptr ColumnVariant::create(const Columns & variants, const std::vector & local_to_global_discriminators) +namespace +{ + +MutableColumns getVariantsAssumeMutable(const Columns & variants) { MutableColumns mutable_variants; - mutable_variants.reserve(variants.size()); + for (const auto & variant : variants) { if (isColumnConst(*variant)) @@ -215,35 +218,24 @@ ColumnVariant::Ptr ColumnVariant::create(const Columns & variants, const std::ve mutable_variants.emplace_back(variant->assumeMutable()); } - return ColumnVariant::create(std::move(mutable_variants), local_to_global_discriminators); + return mutable_variants; +} + +} + +ColumnVariant::Ptr ColumnVariant::create(const Columns & variants, const std::vector & local_to_global_discriminators) +{ + return ColumnVariant::create(getVariantsAssumeMutable(variants), local_to_global_discriminators); } ColumnVariant::Ptr ColumnVariant::create(const DB::ColumnPtr & local_discriminators, const DB::Columns & variants, const std::vector & local_to_global_discriminators) { - MutableColumns mutable_variants; - mutable_variants.reserve(variants.size()); - for (const auto & variant : variants) - { - if (isColumnConst(*variant)) - throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ColumnVariant cannot have ColumnConst as its element"); - mutable_variants.emplace_back(variant->assumeMutable()); - } - - return ColumnVariant::create(local_discriminators->assumeMutable(), std::move(mutable_variants), local_to_global_discriminators); + return ColumnVariant::create(local_discriminators->assumeMutable(), getVariantsAssumeMutable(variants), local_to_global_discriminators); } ColumnVariant::Ptr ColumnVariant::create(const DB::ColumnPtr & local_discriminators, const DB::ColumnPtr & offsets, const DB::Columns & variants, const std::vector & local_to_global_discriminators) { - MutableColumns mutable_variants; - mutable_variants.reserve(variants.size()); - for (const auto & variant : variants) - { - if (isColumnConst(*variant)) - throw Exception(ErrorCodes::ILLEGAL_COLUMN, "ColumnVariant cannot have ColumnConst as its element"); - mutable_variants.emplace_back(variant->assumeMutable()); - } - - return ColumnVariant::create(local_discriminators->assumeMutable(), offsets->assumeMutable(), std::move(mutable_variants), local_to_global_discriminators); + return ColumnVariant::create(local_discriminators->assumeMutable(), offsets->assumeMutable(), 
getVariantsAssumeMutable(variants), local_to_global_discriminators); } MutableColumnPtr ColumnVariant::cloneEmpty() const @@ -309,104 +301,88 @@ MutableColumnPtr ColumnVariant::cloneResized(size_t new_size) const const auto & local_discriminators_data = getLocalDiscriminators(); const auto & offsets_data = getOffsets(); - /// We can find all variants sizes by scanning all new_size local_discriminators and calculating - /// sizes for all new variants. This code is below and commented. - -// std::vector new_nested_sizes(num_variants, 0); -// for (size_t i = 0; i != new_size; ++i) -// { -// Discriminator discr = local_discriminators_data[i]; -// if (discr != NULL_DISCRIMINATOR) -// ++new_nested_sizes[discr]; -// } -// -// MutableColumns new_variants; -// new_variants.reserve(num_variants); -// for (size_t i = 0; i != num_variants; ++i) -// { -// if (new_nested_sizes[i]) -// new_variants.emplace_back(variants[i]->cloneResized(new_nested_sizes[i])); -// else -// new_variants.emplace_back(variants[i]->cloneEmpty()); -// } -// -// return ColumnVariant::create(local_discriminators->cloneResized(new_size), offsets->cloneResized(new_size), std::move(new_variants), local_to_global_discriminators); - + /// We can find all variants sizes by scanning all new_size local_discriminators and calculating sizes for all new variants. /// But instead we are trying to optimize it using offsets column: /// For all non-empty variants we are trying to find last occurrence of its discriminator in local_discriminators[:new_size] or - /// first occurrence in local_discriminators[new_size:]. The same row in offsets column will contain the desired size (or size - 1) of variant. + /// first occurrence in local_discriminators[new_size:] depending on what range is smaller. The same row in offsets column will + /// contain the desired size (or size - 1) of variant. /// All empty variants will remain empty. - /// Not sure how good this optimization is, feel free to remove it and use simpler version above. + /// Not sure how good this optimization is, feel free to remove it and use simpler version without using offsets. MutableColumns new_variants(num_variants); - std::unordered_set seen_variants; + std::vector seen_variants(num_variants, 0); + size_t number_of_seen_variants = 0; /// First, check which variants are empty. They will remain empty. for (Discriminator i = 0; i != num_variants; ++i) { if (variants[i]->empty()) { - seen_variants.insert(i); + seen_variants[i] = 1; + ++number_of_seen_variants; new_variants[i] = variants[i]->cloneEmpty(); } } - /// Now, iterate through local discriminators using two pointers. - /// First will go from new_size - 1 to 0, second from new_size to size. - /// Finish when we find all variants or hit lower or upper bound. - ssize_t i = new_size - 1; - size_t j = new_size; - while (i != -1 && j != size) + /// Now, choose what range is smaller and use it. + /// [0, new_size) + if (2 * new_size <= size) { - Discriminator i_discr = local_discriminators_data[i]; - if (i_discr != NULL_DISCRIMINATOR) + for (ssize_t i = new_size - 1; i > -1; --i) { - auto [_, inserted] = seen_variants.insert(i_discr); - /// If this is the first occurrence of this discriminator, - /// we can get new size for this variant. 
- if (inserted) + Discriminator discr = local_discriminators_data[i]; + if (discr != NULL_DISCRIMINATOR) { - new_variants[i_discr] = variants[i_discr]->cloneResized(offsets_data[i] + 1); - if (seen_variants.size() == num_variants) - break; + /// If this is the first occurrence of this discriminator, + /// we can get new size for this variant. + if (!seen_variants[discr]) + { + seen_variants[discr] = 1; + ++number_of_seen_variants; + new_variants[discr] = variants[discr]->cloneResized(offsets_data[i] + 1); + /// Break if we found sizes for all variants. + if (number_of_seen_variants == num_variants) + break; + } } } - Discriminator j_discr = local_discriminators_data[j]; - if (j_discr != NULL_DISCRIMINATOR) + /// All variants that weren't found in range [0, new_size] will be empty in the result column. + if (number_of_seen_variants != num_variants) { - auto [_, inserted] = seen_variants.insert(j_discr); - /// If this is the first occurrence of this discriminator, - /// we can get new size for this variant. - if (inserted) - { - new_variants[j_discr] = variants[j_discr]->cloneResized(offsets_data[j]); - if (seen_variants.size() == num_variants) - break; - } - } - - --i; - ++j; - } - - /// We can finish in 3 cases: - /// 1) seen_variants.size() == num_variants - we found local_discriminators of all variants, nothing to do. - /// 2) i == -1 - we scanned all values in local_discriminators[:new_size]. Not found variants doesn't have - /// values in local_discriminators[:new_size], so they should be empty in the resized version. - /// 3) j == size - we scanned all values in local_discriminators[new_size:]. Not found variants doesn't have - /// values in local_discriminators[new_size:], so, we should use the full variant in the resized version. - if (seen_variants.size() != num_variants) - { - for (size_t discr = 0; discr != num_variants; ++discr) - { - if (!seen_variants.contains(discr)) - { - if (i == -1) + for (size_t discr = 0; discr != num_variants; ++discr) + if (!seen_variants[discr]) new_variants[discr] = variants[discr]->cloneEmpty(); - else - new_variants[discr] = IColumn::mutate(variants[discr]); + } + } + /// [new_size, size) + else + { + for (size_t i = new_size; i < size; ++i) + { + Discriminator discr = local_discriminators_data[i]; + if (discr != NULL_DISCRIMINATOR) + { + /// If this is the first occurrence of this discriminator, + /// we can get new size for this variant. + if (!seen_variants[discr]) + { + seen_variants[discr] = 1; + ++number_of_seen_variants; + new_variants[discr] = variants[discr]->cloneResized(offsets_data[i]); + /// Break if we found sizes for all variants. + if (number_of_seen_variants == num_variants) + break; + } } } + + if (number_of_seen_variants != num_variants) + { + /// All variants that weren't found in range [new_size, size) will not change their sizes. 
+ for (size_t discr = 0; discr != num_variants; ++discr) + if (!seen_variants[discr]) + new_variants[discr] = IColumn::mutate(variants[discr]); + } } return ColumnVariant::create(local_discriminators->cloneResized(new_size), offsets->cloneResized(new_size), std::move(new_variants), local_to_global_discriminators); @@ -1261,7 +1237,7 @@ std::optional ColumnVariant::getLocalDiscriminator if (variants[i]->size() == local_discriminators->size()) return i; if (!variants[i]->empty()) - return std::nullopt + return std::nullopt; } return std::nullopt; From 10af0d406fb536917a84d23f4bacba073ea9443e Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Wed, 10 Jan 2024 16:55:58 +0100 Subject: [PATCH 0110/1081] Update 02916_broken_projection.sh --- tests/queries/0_stateless/02916_broken_projection.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh index 99e54b08b74..fbd26e59f6f 100755 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ b/tests/queries/0_stateless/02916_broken_projection.sh @@ -1,5 +1,5 @@ #!/usr/bin/env bash -# Tags: long, no-random-merge-tree-settings, no-random-settings, no-s3-storage +# Tags: long, no-random-merge-tree-settings, no-random-settings, no-s3-storage, no-parallel # shellcheck disable=SC2046 CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) From 1deaaf5466a2633d58fba87521435491546df0a2 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Thu, 11 Jan 2024 15:20:06 +0100 Subject: [PATCH 0111/1081] Apply suggestions from code review Co-authored-by: Antonio Andelic --- .../Serializations/SerializationDateTime64.cpp | 6 +++--- src/DataTypes/Serializations/SerializationEnum.h | 5 +---- .../Serializations/SerializationNamed.cpp | 1 - .../Serializations/SerializationTuple.cpp | 15 +++------------ 4 files changed, 7 insertions(+), 20 deletions(-) diff --git a/src/DataTypes/Serializations/SerializationDateTime64.cpp b/src/DataTypes/Serializations/SerializationDateTime64.cpp index a19619bf8d3..442e29edd52 100644 --- a/src/DataTypes/Serializations/SerializationDateTime64.cpp +++ b/src/DataTypes/Serializations/SerializationDateTime64.cpp @@ -50,7 +50,7 @@ void SerializationDateTime64::deserializeText(IColumn & column, ReadBuffer & ist bool SerializationDateTime64::tryDeserializeText(IColumn & column, ReadBuffer & istr, const FormatSettings &, bool whole) const { DateTime64 result = 0; - if (tryReadDateTime64Text(result, scale, istr, time_zone) || (whole && istr.eof())) + if (!tryReadDateTime64Text(result, scale, istr, time_zone) || (whole && !istr.eof())) return false; assert_cast(column).getData().push_back(result); @@ -151,7 +151,7 @@ bool SerializationDateTime64::tryDeserializeTextQuoted(IColumn & column, ReadBuf DateTime64 x = 0; if (checkChar('\'', istr)) /// Cases: '2017-08-31 18:36:48' or '1504193808' { - if (tryReadText(x, scale, istr, settings, time_zone, utc_time_zone) || !checkChar('\'', istr)) + if (!tryReadText(x, scale, istr, settings, time_zone, utc_time_zone) || !checkChar('\'', istr)) return false; } else /// Just 1504193808 or 01504193808 @@ -265,7 +265,7 @@ bool SerializationDateTime64::tryDeserializeTextCSV(IColumn & column, ReadBuffer { if (settings.csv.delimiter != ',' || settings.date_time_input_format == FormatSettings::DateTimeInputFormat::Basic) { - if (tryReadText(x, scale, istr, settings, time_zone, utc_time_zone)) + if 
(!tryReadText(x, scale, istr, settings, time_zone, utc_time_zone)) return false; } else diff --git a/src/DataTypes/Serializations/SerializationEnum.h b/src/DataTypes/Serializations/SerializationEnum.h index 5152a3fbc93..bb720ee9b1f 100644 --- a/src/DataTypes/Serializations/SerializationEnum.h +++ b/src/DataTypes/Serializations/SerializationEnum.h @@ -60,10 +60,7 @@ public: bool tryReadValue(ReadBuffer & istr, FieldType & x) const { - if (!tryReadText(x, istr) || !ref_enum_values.hasValue(x)) - return false; - - return true; + return tryReadText(x, istr) && ref_enum_values.hasValue(x); } std::optional> own_enum_values; diff --git a/src/DataTypes/Serializations/SerializationNamed.cpp b/src/DataTypes/Serializations/SerializationNamed.cpp index 1a9cbe9a37d..ca60948ce68 100644 --- a/src/DataTypes/Serializations/SerializationNamed.cpp +++ b/src/DataTypes/Serializations/SerializationNamed.cpp @@ -1,5 +1,4 @@ #include -#include namespace DB { diff --git a/src/DataTypes/Serializations/SerializationTuple.cpp b/src/DataTypes/Serializations/SerializationTuple.cpp index c0b0658e6b4..79b7fa84242 100644 --- a/src/DataTypes/Serializations/SerializationTuple.cpp +++ b/src/DataTypes/Serializations/SerializationTuple.cpp @@ -212,10 +212,7 @@ ReturnType SerializationTuple::deserializeTextImpl(IColumn & column, ReadBuffer return ReturnType(true); }; - if constexpr (throw_exception) - addElementSafe(elems.size(), column, impl); - else - return addElementSafe(elems.size(), column, impl); + return addElementSafe(elems.size(), column, impl); } void SerializationTuple::deserializeText(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings, bool whole) const @@ -457,10 +454,7 @@ ReturnType SerializationTuple::deserializeTextJSONImpl(IColumn & column, ReadBuf return ReturnType(true); }; - if constexpr (throw_exception) - addElementSafe(elems.size(), column, impl); - else - return addElementSafe(elems.size(), column, impl); + return addElementSafe(elems.size(), column, impl); } else { @@ -502,10 +496,7 @@ ReturnType SerializationTuple::deserializeTextJSONImpl(IColumn & column, ReadBuf return ReturnType(true); }; - if constexpr (throw_exception) - addElementSafe(elems.size(), column, impl); - else - return addElementSafe(elems.size(), column, impl); + return addElementSafe(elems.size(), column, impl); } } From f05d89bc2b26206b1b6854ad48dd35840b82a123 Mon Sep 17 00:00:00 2001 From: avogar Date: Thu, 11 Jan 2024 14:48:57 +0000 Subject: [PATCH 0112/1081] Apply review suggestions --- .../Serializations/ISerialization.cpp | 47 +++--- .../Serializations/SerializationTuple.cpp | 3 + .../Serializations/SerializationVariant.cpp | 135 +++++++++--------- 3 files changed, 101 insertions(+), 84 deletions(-) diff --git a/src/DataTypes/Serializations/ISerialization.cpp b/src/DataTypes/Serializations/ISerialization.cpp index 08575f06f2a..c699b3b0748 100644 --- a/src/DataTypes/Serializations/ISerialization.cpp +++ b/src/DataTypes/Serializations/ISerialization.cpp @@ -176,7 +176,7 @@ String getNameForSubstreamPath( stream_name += "." 
+ it->tuple_element_name; } else if (it->type == Substream::VariantDiscriminators) - stream_name += ".discr"; + stream_name += ".variant_discr"; else if (it->type == Substream::VariantOffsets) stream_name += ".variant_offsets"; else if (it->type == Substream::VariantElement) @@ -261,43 +261,51 @@ bool ISerialization::isSpecialCompressionAllowed(const SubstreamPath & path) return true; } -#define TRY_DESERIALIZE_TEXT(deserialize) \ - size_t prev_size = column.size(); \ - try \ - { \ - deserialize(column, istr, settings); \ - return true; \ - } \ - catch (...) \ - { \ - if (column.size() > prev_size) \ - column.popBack(column.size() - prev_size); \ - return false; \ - } \ +namespace +{ + +template +bool tryDeserializeText(const F deserialize, DB::IColumn & column) +{ + size_t prev_size = column.size(); + try + { + deserialize(column); + return true; + } + catch (...) + { + if (column.size() > prev_size) + column.popBack(column.size() - prev_size); + return false; + } +} + +} bool ISerialization::tryDeserializeTextCSV(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const { - TRY_DESERIALIZE_TEXT(deserializeTextCSV) + return tryDeserializeText([&](DB::IColumn & my_column) { deserializeTextCSV(my_column, istr, settings); }, column); } bool ISerialization::tryDeserializeTextEscaped(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const { - TRY_DESERIALIZE_TEXT(deserializeTextEscaped) + return tryDeserializeText([&](DB::IColumn & my_column) { deserializeTextEscaped(my_column, istr, settings); }, column); } bool ISerialization::tryDeserializeTextJSON(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const { - TRY_DESERIALIZE_TEXT(deserializeTextJSON) + return tryDeserializeText([&](DB::IColumn & my_column) { deserializeTextJSON(my_column, istr, settings); }, column); } bool ISerialization::tryDeserializeTextQuoted(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const { - TRY_DESERIALIZE_TEXT(deserializeTextQuoted) + return tryDeserializeText([&](DB::IColumn & my_column) { deserializeTextQuoted(my_column, istr, settings); }, column); } bool ISerialization::tryDeserializeWholeText(DB::IColumn & column, DB::ReadBuffer & istr, const DB::FormatSettings & settings) const { - TRY_DESERIALIZE_TEXT(deserializeWholeText) + return tryDeserializeText([&](DB::IColumn & my_column) { deserializeWholeText(my_column, istr, settings); }, column); } void ISerialization::deserializeTextRaw(IColumn & column, ReadBuffer & istr, const FormatSettings & settings) const @@ -346,7 +354,6 @@ bool ISerialization::hasSubcolumnForPath(const SubstreamPath & path, size_t pref return path[last_elem].type == Substream::NullMap || path[last_elem].type == Substream::TupleElement || path[last_elem].type == Substream::ArraySizes - || path[last_elem].type == Substream::VariantDiscriminators || path[last_elem].type == Substream::VariantElement; } diff --git a/src/DataTypes/Serializations/SerializationTuple.cpp b/src/DataTypes/Serializations/SerializationTuple.cpp index 79b7fa84242..c249ee69e46 100644 --- a/src/DataTypes/Serializations/SerializationTuple.cpp +++ b/src/DataTypes/Serializations/SerializationTuple.cpp @@ -76,7 +76,10 @@ static ReturnType addElementSafe(size_t num_elems, IColumn & column, F && impl) { auto & element_column = extractElementColumn(column, i); if (element_column.size() > old_size) + { + chassert(old_size - element_column.size() == 1); element_column.popBack(1); + } } }; diff --git 
a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp index 9cfc4b9e26f..64fcb63d604 100644 --- a/src/DataTypes/Serializations/SerializationVariant.cpp +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -397,70 +397,76 @@ void SerializationVariant::deserializeBinary(IColumn & column, ReadBuffer & istr namespace { -std::unordered_map getTypesTextDeserializePriorityMap() +const std::unordered_map & getTypesTextDeserializePriorityMap() { - static const std::vector priorities = { - /// Complex types have highest priority. - TypeIndex::Array, - TypeIndex::Tuple, - TypeIndex::Map, - TypeIndex::AggregateFunction, + static std::unordered_map priority_map = [] + { + static constexpr std::array priorities = { + /// Complex types have highest priority. + TypeIndex::Array, + TypeIndex::Tuple, + TypeIndex::Map, + TypeIndex::AggregateFunction, - /// Enums can be parsed both from strings and numbers. - /// So they have high enough priority. - TypeIndex::Enum8, - TypeIndex::Enum16, + /// Enums can be parsed both from strings and numbers. + /// So they have high enough priority. + TypeIndex::Enum8, + TypeIndex::Enum16, - /// Types that can be parsed from strings. - TypeIndex::UUID, - TypeIndex::IPv4, - TypeIndex::IPv6, + /// Types that can be parsed from strings. + TypeIndex::UUID, + TypeIndex::IPv4, + TypeIndex::IPv6, - /// Types that can be parsed from numbers. - /// The order: - /// 1) Integers - /// 2) Big Integers - /// 3) Decimals - /// 4) Floats - /// In each group small types have higher priority. - TypeIndex::Int8, - TypeIndex::UInt8, - TypeIndex::Int16, - TypeIndex::UInt16, - TypeIndex::Int32, - TypeIndex::UInt32, - TypeIndex::Int64, - TypeIndex::UInt64, - TypeIndex::Int128, - TypeIndex::UInt128, - TypeIndex::Int256, - TypeIndex::UInt256, - TypeIndex::Decimal32, - TypeIndex::Decimal64, - TypeIndex::Decimal128, - TypeIndex::Decimal256, - TypeIndex::Float32, - TypeIndex::Float64, + /// Types that can be parsed from numbers. + /// The order: + /// 1) Integers + /// 2) Big Integers + /// 3) Decimals + /// 4) Floats + /// In each group small types have higher priority. + TypeIndex::Int8, + TypeIndex::UInt8, + TypeIndex::Int16, + TypeIndex::UInt16, + TypeIndex::Int32, + TypeIndex::UInt32, + TypeIndex::Int64, + TypeIndex::UInt64, + TypeIndex::Int128, + TypeIndex::UInt128, + TypeIndex::Int256, + TypeIndex::UInt256, + TypeIndex::Decimal32, + TypeIndex::Decimal64, + TypeIndex::Decimal128, + TypeIndex::Decimal256, + TypeIndex::Float32, + TypeIndex::Float64, - /// Dates and DateTimes. More simple Date types have higher priority. - /// They have lower priority as numbers as some DateTimes sometimes can - /// be also parsed from numbers, but we don't want it usually. - TypeIndex::Date, - TypeIndex::Date32, - TypeIndex::DateTime, - TypeIndex::DateTime64, + /// Dates and DateTimes. More simple Date types have higher priority. + /// They have lower priority as numbers as some DateTimes sometimes can + /// be also parsed from numbers, but we don't want it usually. + TypeIndex::Date, + TypeIndex::Date32, + TypeIndex::DateTime, + TypeIndex::DateTime64, - /// String types have almost the lowest priority, - /// as in text formats almost all data can - /// be deserialized into String type. - TypeIndex::FixedString, - TypeIndex::String, - }; + /// String types have almost the lowest priority, + /// as in text formats almost all data can + /// be deserialized into String type. 
+ TypeIndex::FixedString, + TypeIndex::String, + }; + + std::unordered_map pm; + + pm.reserve(priorities.size()); + for (size_t i = 0; i != priorities.size(); ++i) + pm[priorities[i]] = priorities.size() - i; + return pm; + }(); - std::unordered_map priority_map; - priority_map.reserve(priorities.size()); - for (size_t i = 0; i != priorities.size(); ++i) - priority_map[priorities[i]] = priorities.size() - i; return priority_map; } @@ -476,7 +482,7 @@ std::unordered_map getTypesTextDeserializePriorityMap() /// so if we have types with the same level of nesting and the same priority, we will first try to deserialize LowCardinality/Nullable types /// (for example if we have types Array(Array(String)) and Array(Array(Nullable(String))). /// This is just a batch of heuristics. -std::tuple getTypeTextDeserializePriority(const DataTypePtr & type, size_t nested_depth, size_t simple_nested_depth, std::unordered_map & priority_map) +std::tuple getTypeTextDeserializePriority(const DataTypePtr & type, size_t nested_depth, size_t simple_nested_depth, const std::unordered_map & priority_map) { if (const auto * nullable_type = typeid_cast(type.get())) return getTypeTextDeserializePriority(nullable_type->getNestedType(), nested_depth, simple_nested_depth + 1, priority_map); @@ -487,7 +493,7 @@ std::tuple getTypeTextDeserializePriority(const DataType if (const auto * array_type = typeid_cast(type.get())) { auto [elements_nested_depth, elements_priority, elements_simple_nested_depth] = getTypeTextDeserializePriority(array_type->getNestedType(), nested_depth + 1, simple_nested_depth, priority_map); - return {elements_nested_depth, elements_priority + priority_map[TypeIndex::Array], elements_simple_nested_depth}; + return {elements_nested_depth, elements_priority + priority_map.at(TypeIndex::Array), elements_simple_nested_depth}; } if (const auto * tuple_type = typeid_cast(type.get())) @@ -505,14 +511,14 @@ std::tuple getTypeTextDeserializePriority(const DataType max_simple_nested_depth = elem_simple_nested_depth; } - return {max_nested_depth, sum_priority + priority_map[TypeIndex::Tuple], max_simple_nested_depth}; + return {max_nested_depth, sum_priority + priority_map.at(TypeIndex::Tuple), max_simple_nested_depth}; } if (const auto * map_type = typeid_cast(type.get())) { auto [key_max_depth, key_priority, key_simple_nested_depth] = getTypeTextDeserializePriority(map_type->getKeyType(), nested_depth + 1, simple_nested_depth, priority_map); auto [value_max_depth, value_priority, value_simple_nested_depth] = getTypeTextDeserializePriority(map_type->getValueType(), nested_depth + 1, simple_nested_depth, priority_map); - return {std::max(key_max_depth, value_max_depth), key_priority + value_priority + priority_map[TypeIndex::Map], std::max(key_simple_nested_depth, value_simple_nested_depth)}; + return {std::max(key_max_depth, value_max_depth), key_priority + value_priority + priority_map.at(TypeIndex::Map), std::max(key_simple_nested_depth, value_simple_nested_depth)}; } if (const auto * variant_type = typeid_cast(type.get())) @@ -536,9 +542,10 @@ std::tuple getTypeTextDeserializePriority(const DataType /// Bool type should have priority higher then all integers. 
if (isBool(type)) - return {nested_depth, priority_map[TypeIndex::Int8] + 1, simple_nested_depth}; + return {nested_depth, priority_map.at(TypeIndex::Int8) + 1, simple_nested_depth}; - return {nested_depth, priority_map[type->getTypeId()], simple_nested_depth}; + auto it = priority_map.find(type->getTypeId()); + return {nested_depth, it == priority_map.end() ? 0 : it->second, simple_nested_depth}; } } @@ -549,7 +556,7 @@ std::vector SerializationVariant::getVariantsDeserializeTextOrder(const priorities.reserve(variant_types.size()); std::vector order; order.reserve(variant_types.size()); - auto priority_map = getTypesTextDeserializePriorityMap(); + const auto & priority_map = getTypesTextDeserializePriorityMap(); for (size_t i = 0; i != variant_types.size(); ++i) { priorities.push_back(getTypeTextDeserializePriority(variant_types[i], 0, 0, priority_map)); From 9e639df12e69c7373e400115977c432b8fdf31f2 Mon Sep 17 00:00:00 2001 From: avogar Date: Thu, 11 Jan 2024 18:44:05 +0000 Subject: [PATCH 0113/1081] Add fixes, add new mode to getLeastSupertype and use it in if/multiIf --- .../Serializations/SerializationTuple.cpp | 2 +- src/DataTypes/getLeastSupertype.cpp | 73 ++++++++++++++++--- src/DataTypes/getLeastSupertype.h | 12 +++ src/Functions/if.cpp | 14 +--- src/Functions/multiIf.cpp | 8 +- ...940_variant_text_deserialization.reference | 2 +- 6 files changed, 79 insertions(+), 32 deletions(-) diff --git a/src/DataTypes/Serializations/SerializationTuple.cpp b/src/DataTypes/Serializations/SerializationTuple.cpp index c249ee69e46..5d8c84b70bf 100644 --- a/src/DataTypes/Serializations/SerializationTuple.cpp +++ b/src/DataTypes/Serializations/SerializationTuple.cpp @@ -77,7 +77,7 @@ static ReturnType addElementSafe(size_t num_elems, IColumn & column, F && impl) auto & element_column = extractElementColumn(column, i); if (element_column.size() > old_size) { - chassert(old_size - element_column.size() == 1); + chassert(element_column.size() - old_size == 1); element_column.popBack(1); } } diff --git a/src/DataTypes/getLeastSupertype.cpp b/src/DataTypes/getLeastSupertype.cpp index e5bdb4b267f..5d67f888c4b 100644 --- a/src/DataTypes/getLeastSupertype.cpp +++ b/src/DataTypes/getLeastSupertype.cpp @@ -18,6 +18,7 @@ #include #include #include +#include namespace DB @@ -58,6 +59,25 @@ DataTypePtr throwOrReturn(const DataTypes & types, std::string_view message_suff if constexpr (on_error == LeastSupertypeOnError::String) return std::make_shared(); + if constexpr (on_error == LeastSupertypeOnError::Variant && std::is_same_v>) + { + DataTypes variants; + for (const auto & type : types) + { + if (isVariant(type)) + { + const DataTypes & nested_variants = assert_cast(*type).getVariants(); + variants.insert(variants.end(), nested_variants.begin(), nested_variants.end()); + } + else + { + variants.push_back(removeNullableOrLowCardinalityNullable(type)); + } + } + + return std::make_shared(variants); + } + if constexpr (on_error == LeastSupertypeOnError::Null) return nullptr; @@ -67,8 +87,8 @@ DataTypePtr throwOrReturn(const DataTypes & types, std::string_view message_suff throw Exception(error_code, "There is no supertype for types {} {}", getExceptionMessagePrefix(types), message_suffix); } -template -DataTypePtr getNumericType(const TypeIndexSet & types) +template +DataTypePtr getNumericType(const TypeIndexSet & types, ThrowOrReturnFunc throwOrReturnFunc) { bool all_numbers = true; @@ -119,7 +139,7 @@ DataTypePtr getNumericType(const TypeIndexSet & types) if (max_bits_of_signed_integer || 
max_bits_of_unsigned_integer || max_mantissa_bits_of_floating) { if (!all_numbers) - return throwOrReturn(types, "because some of them are numbers and some of them are not", ErrorCodes::NO_COMMON_TYPE); + return throwOrReturnFunc(types, "because some of them are numbers and some of them are not", ErrorCodes::NO_COMMON_TYPE); /// If there are signed and unsigned types of same bit-width, the result must be signed number with at least one more bit. /// Example, common of Int32, UInt32 = Int64. @@ -134,7 +154,7 @@ DataTypePtr getNumericType(const TypeIndexSet & types) if (min_bit_width_of_integer != 64) ++min_bit_width_of_integer; else - return throwOrReturn(types, + return throwOrReturnFunc(types, "because some of them are signed integers and some are unsigned integers," " but there is no signed integer type, that can exactly represent all required unsigned integer values", ErrorCodes::NO_COMMON_TYPE); @@ -149,7 +169,7 @@ DataTypePtr getNumericType(const TypeIndexSet & types) else if (min_mantissa_bits <= 53) return std::make_shared(); else - return throwOrReturn(types, + return throwOrReturnFunc(types, " because some of them are integers and some are floating point," " but there is no floating point type, that can exactly represent all required integers", ErrorCodes::NO_COMMON_TYPE); } @@ -170,7 +190,7 @@ DataTypePtr getNumericType(const TypeIndexSet & types) else if (min_bit_width_of_integer <= 256) return std::make_shared(); else - return throwOrReturn(types, + return throwOrReturnFunc(types, " because some of them are signed integers and some are unsigned integers," " but there is no signed integer type, that can exactly represent all required unsigned integer values", ErrorCodes::NO_COMMON_TYPE); } @@ -190,7 +210,7 @@ DataTypePtr getNumericType(const TypeIndexSet & types) else if (min_bit_width_of_integer <= 256) return std::make_shared(); else - return throwOrReturn(types, + return throwOrReturnFunc(types, " but as all data types are unsigned integers, we must have found maximum unsigned integer type", ErrorCodes::NO_COMMON_TYPE); } } @@ -382,7 +402,18 @@ DataTypePtr getLeastSupertype(const DataTypes & types) if (!all_maps) return throwOrReturn(types, "because some of them are Maps and some of them are not", ErrorCodes::NO_COMMON_TYPE); - auto keys_common_type = getLeastSupertype(key_types); + DataTypePtr keys_common_type; + if constexpr (on_error == LeastSupertypeOnError::Variant) + { + keys_common_type = getLeastSupertype(key_types); + if (!keys_common_type) + return throwOrReturn(types, "", ErrorCodes::NO_COMMON_TYPE); + } + else + { + keys_common_type = getLeastSupertype(key_types); + } + auto values_common_type = getLeastSupertype(value_types); /// When on_error == LeastSupertypeOnError::Null and we cannot get least supertype for keys or values, /// keys_common_type or values_common_type will be nullptr, we should return nullptr in this case. @@ -423,7 +454,18 @@ DataTypePtr getLeastSupertype(const DataTypes & types) return getLeastSupertype(nested_types); else { - auto nested_type = getLeastSupertype(nested_types); + DataTypePtr nested_type; + if constexpr (on_error == LeastSupertypeOnError::Variant) + { + nested_type = getLeastSupertype(nested_types); + if (!nested_type) + return throwOrReturn(types, "", ErrorCodes::NO_COMMON_TYPE); + } + else + { + nested_type = getLeastSupertype(nested_types); + } + /// When on_error == LeastSupertypeOnError::Null and we cannot get least supertype, /// nested_type will be nullptr, we should return nullptr in this case. 
if (!nested_type) @@ -456,6 +498,8 @@ DataTypePtr getLeastSupertype(const DataTypes & types) if (have_nullable) { auto nested_type = getLeastSupertype(nested_types); + if (isVariant(nested_type)) + return nested_type; /// When on_error == LeastSupertypeOnError::Null and we cannot get least supertype, /// nested_type will be nullptr, we should return nullptr in this case. if (!nested_type) @@ -623,7 +667,8 @@ DataTypePtr getLeastSupertype(const DataTypes & types) { /// First, if we have signed integers, try to convert all UInt64 to Int64 if possible. convertUInt64toInt64IfPossible(types, type_ids); - auto numeric_type = getNumericType(type_ids); + auto throw_or_return = [&](const TypeIndexSet &, std::string_view message_suffix, int error_code){ return throwOrReturn(types, message_suffix, error_code); }; + auto numeric_type = getNumericType(type_ids, throw_or_return); if (numeric_type) return numeric_type; } @@ -637,6 +682,11 @@ DataTypePtr getLeastSupertypeOrString(const DataTypes & types) return getLeastSupertype(types); } +DataTypePtr getLeastSupertypeOrVariant(const DataTypes & types) +{ + return getLeastSupertype(types); +} + DataTypePtr tryGetLeastSupertype(const DataTypes & types) { return getLeastSupertype(types); @@ -676,7 +726,8 @@ DataTypePtr getLeastSupertype(const TypeIndexSet & types) return std::make_shared(); } - auto numeric_type = getNumericType(types); + auto throw_or_return = [](const TypeIndexSet & type_ids, std::string_view message_suffix, int error_code){ return throwOrReturn(type_ids, message_suffix, error_code); }; + auto numeric_type = getNumericType(types, throw_or_return); if (numeric_type) return numeric_type; diff --git a/src/DataTypes/getLeastSupertype.h b/src/DataTypes/getLeastSupertype.h index 2ef4a0e6850..d949fad69c5 100644 --- a/src/DataTypes/getLeastSupertype.h +++ b/src/DataTypes/getLeastSupertype.h @@ -8,6 +8,7 @@ enum class LeastSupertypeOnError { Throw, String, + Variant, Null, }; @@ -24,6 +25,17 @@ DataTypePtr getLeastSupertype(const DataTypes & types); /// All types can be casted to String, because they can be serialized to String. DataTypePtr getLeastSupertypeOrString(const DataTypes & types); +/// Same as getLeastSupertype but in case when there is no supertype for some types +/// it uses Variant of these types as a supertype. Any type can be casted to a Variant +/// that contains this type. +/// As nested Variants are not allowed, if one of the types is Variant, it's variants +/// are used in the resulting Variant. +/// Examples: +/// (UInt64, String) -> Variant(UInt64, String) +/// (Array(UInt64), Array(String)) -> Array(Variant(UInt64, String)) +/// (Variant(UInt64, String), Array(UInt32)) -> Variant(UInt64, String, Array(UInt32)) +DataTypePtr getLeastSupertypeOrVariant(const DataTypes & types); + /// Same as above but return nullptr instead of throwing exception. 
DataTypePtr tryGetLeastSupertype(const DataTypes & types); diff --git a/src/Functions/if.cpp b/src/Functions/if.cpp index 1dc7443f124..c247938f885 100644 --- a/src/Functions/if.cpp +++ b/src/Functions/if.cpp @@ -688,15 +688,9 @@ private: DataTypePtr common_type; if (use_variant_when_no_common_type) - { - common_type = tryGetLeastSupertype(DataTypes{arg1.type, arg2.type}); - if (!common_type) - common_type = std::make_shared(DataTypes{removeNullableOrLowCardinalityNullable(arg1.type), removeNullableOrLowCardinalityNullable(arg2.type)}); - } + common_type = getLeastSupertypeOrVariant(DataTypes{arg1.type, arg2.type}); else - { common_type = getLeastSupertype(DataTypes{arg1.type, arg2.type}); - } ColumnPtr col_then = castColumn(arg1, common_type); ColumnPtr col_else = castColumn(arg2, common_type); @@ -1118,11 +1112,7 @@ public: "Must be UInt8.", arguments[0]->getName()); if (use_variant_when_no_common_type) - { - if (auto res = tryGetLeastSupertype(DataTypes{arguments[1], arguments[2]})) - return res; - return std::make_shared(DataTypes{removeNullableOrLowCardinalityNullable(arguments[1]), removeNullableOrLowCardinalityNullable(arguments[2])}); - } + return getLeastSupertypeOrVariant(DataTypes{arguments[1], arguments[2]}); return getLeastSupertype(DataTypes{arguments[1], arguments[2]}); } diff --git a/src/Functions/multiIf.cpp b/src/Functions/multiIf.cpp index 7a2e9444b2c..cefbea9f352 100644 --- a/src/Functions/multiIf.cpp +++ b/src/Functions/multiIf.cpp @@ -119,13 +119,7 @@ public: }); if (context->getSettingsRef().allow_experimental_variant_type && context->getSettingsRef().use_variant_when_no_common_type_in_if) - { - if (auto res = tryGetLeastSupertype(types_of_branches)) - return res; - for (auto & type : types_of_branches) - type = removeNullableOrLowCardinalityNullable(type); - return std::make_shared(types_of_branches); - } + return getLeastSupertypeOrVariant(types_of_branches); return getLeastSupertype(types_of_branches); } diff --git a/tests/queries/0_stateless/02940_variant_text_deserialization.reference b/tests/queries/0_stateless/02940_variant_text_deserialization.reference index 98725917567..8836e6c4e57 100644 --- a/tests/queries/0_stateless/02940_variant_text_deserialization.reference +++ b/tests/queries/0_stateless/02940_variant_text_deserialization.reference @@ -505,7 +505,7 @@ String (NULL,NULL),('string',NULL),(-1,-1),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,NULL),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,-1),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,NULL),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,-1),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,NULL),(0,0),(10000000000,NULL)(NULL,NULL),('string',NULL),(-1,-1),(0,0),(10000000000000000000000,NULL)(NULL,NULL),('string',NULL),(-1,NULL),(0,0),(10000000000000000000000,NULL)(NULL,NULL),('string',NULL),(-1,-1),(0,0)(NULL,NULL),('string',NULL),(-1,NULL),(0,0)Floats (NULL,NULL),('string',NULL),(42.42,42.42)(NULL,NULL),('string',NULL),(42.42,42.42)Decimals (NULL,NULL),('string',NULL),(42.42,42.42)(NULL,NULL),('string',NULL),(42.42,42.42)(NULL,NULL),('string',NULL),(42.42,42.42)(NULL,NULL),('string',NULL),(42.42,42.42)Dates and DateTimes -(NULL,NULL),('string',NULL),('1970-01-01 00:00:00.000',NULL),('2020-01-01','2020-01-01'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('1970-01-01 00:00:00.000',NULL),('1900-01-01','1900-01-01'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('1970-01-01 00:00:00.000',NULL),('2020-01-01 
00:00:00','2020-01-01 00:00:00'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('1970-01-01 00:00:00.000','1970-01-01 00:00:00.000'),('2020-01-01 00:00:00.999',NULL),('2020-01-01 00:00:00.999999999 ABC',NULL)UUID +(NULL,NULL),('string',NULL),('2020-01-d1',NULL),('2020-01-01','2020-01-01'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('2020-01-d1',NULL),('1900-01-01','1900-01-01'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('2020-01-d1',NULL),('2020-01-01 00:00:00','2020-01-01 00:00:00'),('2020-01-01 00:00:00.999',NULL)(NULL,NULL),('string',NULL),('2020-01-d1',NULL),('2020-01-01 00:00:00.999','2020-01-01 00:00:00.999'),('2020-01-01 00:00:00.999999999 ABC',NULL)UUID (NULL,NULL),('string',NULL),('c8619cca-0caa-445e-ae76-1d4f6e0b3927','c8619cca-0caa-445e-ae76-1d4f6e0b3927'),('c8619cca-0caa-445e-ae76-1d4f6e0b3927AAA',NULL)IPv4 (NULL,NULL),('string',NULL),('127.0.0.1','127.0.0.1'),('127.0.0.1AAA',NULL)IPv6 (NULL,NULL),('string',NULL),('2001:db8:85a3::8a2e:370:7334','2001:db8:85a3::8a2e:370:7334'),('2001:0db8:85a3:0000:0000:8a2e:0370:7334AAA',NULL)Enum From c30736d415fcdaccb68a1c0e37e8c4de9242e014 Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Fri, 12 Jan 2024 15:31:15 +0000 Subject: [PATCH 0114/1081] Cosmetics --- src/Storages/MergeTree/MutateTask.cpp | 8 +-- ...mn_must_not_override_past_values.reference | 33 ++++++++++++ ...e_column_must_not_override_past_values.sql | 53 +++++++++++++++++++ ..._column_not_override_past_values.reference | 29 ---------- ...ialize_column_not_override_past_values.sql | 49 ----------------- 5 files changed, 90 insertions(+), 82 deletions(-) create mode 100644 tests/queries/0_stateless/02946_materialize_column_must_not_override_past_values.reference create mode 100644 tests/queries/0_stateless/02946_materialize_column_must_not_override_past_values.sql delete mode 100644 tests/queries/0_stateless/02946_materialize_column_not_override_past_values.reference delete mode 100644 tests/queries/0_stateless/02946_materialize_column_not_override_past_values.sql diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index bb41608eb00..25fa45e7b68 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -76,8 +76,8 @@ static void splitAndModifyMutationCommands( { if (command.type == MutationCommand::Type::MATERIALIZE_COLUMN) { - /// For ordinary column with default expression, materialize column should not override past values - /// So we only mutated column if `command.column_name` is a materialized column or if the part does not have physical column file + /// For ordinary column with default or materialized expression, MATERIALIZE COLUMN should not override past values + /// So we only mutate column if `command.column_name` is a default/materialized column or if the part does not have physical column file auto column_ordinary = table_columns.getOrdinary().tryGetByName(command.column_name); if (!column_ordinary || !part->tryGetColumn(command.column_name) || !part->hasColumnFiles(*column_ordinary)) { @@ -206,8 +206,8 @@ static void splitAndModifyMutationCommands( { if (command.type == MutationCommand::Type::MATERIALIZE_COLUMN) { - /// For ordinary column with default expression, materialize column should not override past values - /// So we only mutated column if `command.column_name` is a materialized column or if the part does not have physical column file + /// For ordinary column with default or materialized expression, MATERIALIZE COLUMN should 
not override past values + /// So we only mutate column if `command.column_name` is a default/materialized column or if the part does not have physical column file auto column_ordinary = table_columns.getOrdinary().tryGetByName(command.column_name); if (!column_ordinary || !part->tryGetColumn(command.column_name) || !part->hasColumnFiles(*column_ordinary)) for_interpreter.push_back(command); diff --git a/tests/queries/0_stateless/02946_materialize_column_must_not_override_past_values.reference b/tests/queries/0_stateless/02946_materialize_column_must_not_override_past_values.reference new file mode 100644 index 00000000000..a5a0370620b --- /dev/null +++ b/tests/queries/0_stateless/02946_materialize_column_must_not_override_past_values.reference @@ -0,0 +1,33 @@ +-- Compact parts +Origin +1 2 +2 54321 +After materialize +1 2 +2 54321 +-- Wide parts +Origin +1 2 +2 54321 +After materialize +1 2 +2 54321 +-- Nullable column != physically absent +Origin +1 2 +2 \N +3 54321 +After materialize +1 2 +2 \N +3 54321 +-- Parts with renamed column +Origin +1 2 +2 54321 +After rename +1 2 +2 54321 +After materialize +1 2 +2 54321 diff --git a/tests/queries/0_stateless/02946_materialize_column_must_not_override_past_values.sql b/tests/queries/0_stateless/02946_materialize_column_must_not_override_past_values.sql new file mode 100644 index 00000000000..825c7eab048 --- /dev/null +++ b/tests/queries/0_stateless/02946_materialize_column_must_not_override_past_values.sql @@ -0,0 +1,53 @@ +SET mutations_sync = 2; + +SELECT '-- Compact parts'; + +CREATE TABLE tab (id Int64, dflt Int64 DEFAULT 54321) ENGINE MergeTree ORDER BY id; +INSERT INTO tab (id, dflt) VALUES (1, 2); +INSERT INTO tab (id) VALUES (2); +SELECT 'Origin'; +SELECT * FROM tab ORDER BY id; +ALTER TABLE tab MATERIALIZE COLUMN dflt; +SELECT 'After materialize'; +SELECT * FROM tab ORDER BY id; +DROP TABLE tab; + +SELECT '-- Wide parts'; + +CREATE TABLE tab (id Int64, dflt Int64 DEFAULT 54321) ENGINE MergeTree ORDER BY id SETTINGS min_bytes_for_wide_part = 1; +INSERT INTO tab (id, dflt) VALUES (1, 2); +INSERT INTO tab (id) VALUES (2); +SELECT 'Origin'; +SELECT * FROM tab ORDER BY id; +ALTER TABLE tab MATERIALIZE COLUMN dflt; +SELECT 'After materialize'; +SELECT * FROM tab ORDER BY id; +DROP TABLE tab; + +SELECT '-- Nullable column != physically absent'; + +CREATE TABLE tab (id Int64, dflt Nullable(Int64) DEFAULT 54321) ENGINE MergeTree ORDER BY id SETTINGS min_bytes_for_wide_part = 1; +INSERT INTO tab (id, dflt) VALUES (1, 2); +INSERT INTO tab (id, dflt) VALUES (2, NULL); +INSERT INTO tab (id) VALUES (3); +SELECT 'Origin'; +SELECT * FROM tab ORDER BY id; +ALTER TABLE tab MATERIALIZE COLUMN dflt; +SELECT 'After materialize'; +SELECT * FROM tab ORDER BY id; +DROP TABLE tab; + +SELECT '-- Parts with renamed column'; + +CREATE TABLE tab (id Int64, dflt Int64 DEFAULT 54321) ENGINE MergeTree ORDER BY id; +INSERT INTO tab (id, dflt) VALUES (1, 2); +INSERT INTO tab (id) VALUES (2); +SELECT 'Origin'; +SELECT * FROM tab ORDER BY id; +ALTER TABLE tab RENAME COLUMN dflt TO dflt2; +SELECT 'After rename'; +SELECT * FROM tab ORDER BY id; +ALTER TABLE tab MATERIALIZE COLUMN dflt2; +SELECT 'After materialize'; +SELECT * FROM tab ORDER BY id; +DROP TABLE tab; diff --git a/tests/queries/0_stateless/02946_materialize_column_not_override_past_values.reference b/tests/queries/0_stateless/02946_materialize_column_not_override_past_values.reference deleted file mode 100644 index 6b0d88bd09b..00000000000 ---
a/tests/queries/0_stateless/02946_materialize_column_not_override_past_values.reference +++ /dev/null @@ -1,29 +0,0 @@ ---Origin-- -1 2 -2 54321 ---After materialize-- -1 2 -2 54321 ---Origin-- -1 2 -2 54321 ---After materialize-- -1 2 -2 54321 ---Origin-- -1 2 -2 \N -3 54321 ---After materialize-- -1 2 -2 \N -3 54321 ---Origin-- -1 2 -2 54321 ---After rename-- -1 2 -2 54321 ---After materialize-- -1 2 -2 54321 diff --git a/tests/queries/0_stateless/02946_materialize_column_not_override_past_values.sql b/tests/queries/0_stateless/02946_materialize_column_not_override_past_values.sql deleted file mode 100644 index 1815661e097..00000000000 --- a/tests/queries/0_stateless/02946_materialize_column_not_override_past_values.sql +++ /dev/null @@ -1,49 +0,0 @@ - -SET mutations_sync = 2; --- Compact parts -CREATE TABLE test (id Int64, foo Int64 default 54321) ENGINE MergeTree ORDER BY id; -INSERT INTO test ( id, foo ) values ( 1, 2 ); -INSERT INTO test ( id ) values ( 2 ); -SELECT '--Origin--'; -SELECT * FROM test ORDER BY id; -ALTER TABLE test MATERIALIZE COLUMN foo; -SELECT '--After materialize--'; -SELECT * FROM test ORDER BY id; -DROP TABLE test; - --- Wide parts -CREATE TABLE test (id Int64, foo Nullable(Int64) default 54321) ENGINE MergeTree ORDER BY id SETTINGS min_bytes_for_wide_part = 1; -INSERT INTO test ( id, foo ) values ( 1, 2 ); -INSERT INTO test ( id ) values ( 2 ); -SELECT '--Origin--'; -SELECT * FROM test ORDER BY id; -ALTER TABLE test MATERIALIZE COLUMN foo; -SELECT '--After materialize--'; -SELECT * FROM test ORDER BY id; -DROP TABLE test; - --- Nullable column != physically absent -CREATE TABLE test (id Int64, foo Nullable(Int64) default 54321) ENGINE MergeTree ORDER BY id SETTINGS min_bytes_for_wide_part = 1; -INSERT INTO test ( id, foo ) values ( 1, 2 ); -INSERT INTO test ( id, foo ) values ( 2, NULL ); -INSERT INTO test ( id ) values ( 3 ); -SELECT '--Origin--'; -SELECT * FROM test ORDER BY id; -ALTER TABLE test MATERIALIZE COLUMN foo; -SELECT '--After materialize--'; -SELECT * FROM test ORDER BY id; -DROP TABLE test; - --- Parts with renamed column -CREATE TABLE test (id Int64, foo Int64 default 54321) ENGINE MergeTree ORDER BY id; -INSERT INTO test ( id, foo ) values ( 1, 2 ); -INSERT INTO test ( id ) values ( 2 ); -SELECT '--Origin--'; -SELECT * FROM test ORDER BY id; -ALTER TABLE test RENAME COLUMN foo TO bar; -SELECT '--After rename--'; -SELECT * FROM test ORDER BY id; -ALTER TABLE test MATERIALIZE COLUMN bar; -SELECT '--After materialize--'; -SELECT * FROM test ORDER BY id; -DROP TABLE test; \ No newline at end of file From 1dacfc53ff97fbab6ee349c6df27b3ad2f9df1e8 Mon Sep 17 00:00:00 2001 From: Dale Mcdiarmid Date: Fri, 12 Jan 2024 17:28:45 +0000 Subject: [PATCH 0115/1081] weather data --- .../getting-started/example-datasets/noaa.md | 340 ++++++++++++++++++ 1 file changed, 340 insertions(+) create mode 100644 docs/en/getting-started/example-datasets/noaa.md diff --git a/docs/en/getting-started/example-datasets/noaa.md b/docs/en/getting-started/example-datasets/noaa.md new file mode 100644 index 00000000000..8d34ff8d3ee --- /dev/null +++ b/docs/en/getting-started/example-datasets/noaa.md @@ -0,0 +1,340 @@ +--- +slug: /en/getting-started/example-datasets/noaa +sidebar_label: NOAA Global Historical Climatology Network +sidebar_position: 1 +description: 2.5 billion rows of climate data for the last 120 yrs +--- + +# NOAA Global Historical Climatology Network + +This dataset contains weather measurements for the last 120 years. 
Each row is a measurement for a point in time and station. + +More precisely and according to the [origin of this data](https://github.com/awslabs/open-data-docs/tree/main/docs/noaa/noaa-ghcn): + +> GHCN-Daily is a dataset that contains daily observations over global land areas. It contains station-based measurements from land-based stations worldwide, about two thirds of which are for precipitation measurements only (Menne et al., 2012). GHCN-Daily is a composite of climate records from numerous sources that were merged together and subjected to a common suite of quality assurance reviews (Durre et al., 2010). The archive includes the following meteorological elements: + + - Daily maximum temperature + - Daily minimum temperature + - Temperature at the time of observation + - Precipitation (i.e., rain, melted snow) + - Snowfall + - Snow depth + - Other elements where available + +## Downloading the data + +The data is available in two forms: + +- A [pre-prepared version](#pre-prepared-data) of the data for ClickHouse, which has been cleansed, re-structured, and enriched. This data covers the years 1900 to 2022. +- [Download the original data](#original-data) and convert it to the format required by ClickHouse. Users wanting to add their own columns may wish to explore this approach. + +### Pre-prepared data + +More specifically, rows that failed any of NOAA's quality assurance checks have been removed. The data has also been restructured from a measurement per line to a row per station id and date i.e. + +```csv +"station_id","date","tempAvg","tempMax","tempMin","precipitation","snowfall","snowDepth","percentDailySun","averageWindSpeed","maxWindSpeed","weatherType" +"AEM00041194","2022-07-30",347,0,308,0,0,0,0,0,0,0 +"AEM00041194","2022-07-31",371,413,329,0,0,0,0,0,0,0 +"AEM00041194","2022-08-01",384,427,357,0,0,0,0,0,0,0 +"AEM00041194","2022-08-02",381,424,352,0,0,0,0,0,0,0 +``` + +This is simpler to query and ensures the resulting table is less sparse. Finally, the data has also been enriched with latitude and longitude. + +This data is available in the following S3 location. Either download the data to your local filesystem (and insert using the ClickHouse client) or insert directly into ClickHouse (see [Inserting from S3](#inserting-from-s3)). + +To download: + +```bash +wget https://datasets-documentation.s3.eu-west-3.amazonaws.com/noaa/noaa_enriched.parquet +``` + +### Original data + +The following details the steps to download and transform the original data in preparation for loading into ClickHouse. + +#### Download + +To download the original data: + +```bash +for i in {1900..2023}; do wget https://noaa-ghcn-pds.s3.amazonaws.com/csv.gz/${i}.csv.gz; done +``` + +#### Sampling the data + +```bash +zcat 2021.csv.gz | head +AE000041196,20210101,TMAX,278,,,S, +AE000041196,20210101,PRCP,0,D,,S, +AE000041196,20210101,TAVG,214,H,,S, +AEM00041194,20210101,TMAX,266,,,S, +AEM00041194,20210101,TMIN,178,,,S, +AEM00041194,20210101,PRCP,0,,,S, +AEM00041194,20210101,TAVG,217,H,,S, +AEM00041217,20210101,TMAX,262,,,S, +AEM00041217,20210101,TMIN,155,,,S, +AEM00041217,20210101,TAVG,202,H,,S, +``` + +Summarizing the [format documentation](https://github.com/awslabs/open-data-docs/tree/main/docs/noaa/noaa-ghcn), the columns in order: + + - An 11 character station identification code. This itself encodes some useful information + - YEAR/MONTH/DAY = 8 character date in YYYYMMDD format (e.g. 19860529 = May 29, 1986) + - ELEMENT = 4 character indicator of element type.
Effectively the measurement type. While there are many measurements available, we select the following: + - PRCP - Precipitation (tenths of mm) + - SNOW - Snowfall (mm) + - SNWD - Snow depth (mm) + - TMAX - Maximum temperature (tenths of degrees C) + - TAVG - Average temperature (tenths of a degrees C) + - TMIN - Minimum temperature (tenths of degrees C) + - PSUN - Daily percent of possible sunshine (percent) + - AWND - Average daily wind speed (tenths of meters per second) + - WSFG - Peak gust wind speed (tenths of meters per second) + - WT** = Weather Type where ** defines the weather type. Full list of weather types here. +- DATA VALUE = 5 character data value for ELEMENT i.e. the value of the measurement. +- M-FLAG = 1 character Measurement Flag. This has 10 possible values. Some of these values indicate questionable data accuracy. We accept data where this is set to “P” - identified as missing presumed zero, as this is only relevant to the PRCP, SNOW and SNWD measurements. +- Q-FLAG is the measurement quality flag with 14 possible values. We are only interested in data with an empty value i.e. it did not fail any quality assurance checks. +- S-FLAG is the source flag for the observation. Not useful for our analysis and ignored. +- OBS-TIME = 4-character time of observation in hour-minute format (i.e. 0700 =7:00 am). Typically not present in older data. We ignore this for our purposes. + +A measurement per line would result in a sparse table structure in ClickHouse. We should transform to a row per time and station, with measurements as columns. First, we limit the dataset to those rows without issues i.e. where `qFlag` is equal to an empty string. + +#### Clean the data + +Using [ClickHouse local](https://clickhouse.com/blog/extracting-converting-querying-local-files-with-sql-clickhouse-local) we can filter rows that represent measurements of interest and pass our quality requirements: + +```bash +clickhouse local --query "SELECT count() +FROM file('*.csv.gz', CSV, 'station_id String, date String, measurement String, value Int64, mFlag String, qFlag String, sFlag String, obsTime String') WHERE qFlag = '' AND (measurement IN ('PRCP', 'SNOW', 'SNWD', 'TMAX', 'TAVG', 'TMIN', 'PSUN', 'AWND', 'WSFG') OR startsWith(measurement, 'WT'))" + +2679264563 +``` + +With over 2.6 billion rows, this isn’t a fast query since it involves parsing all the files. On our 8 core machine, this takes around 160 seconds. + + +### Pivot data + +While the measurement per line structure can be used with ClickHouse, it will unnecessarily complicate future queries. Ideally, we need a row per station id and date, where each measurement type and associated value are a column i.e. + +```csv +"station_id","date","tempAvg","tempMax","tempMin","precipitation","snowfall","snowDepth","percentDailySun","averageWindSpeed","maxWindSpeed","weatherType" +"AEM00041194","2022-07-30",347,0,308,0,0,0,0,0,0,0 +"AEM00041194","2022-07-31",371,413,329,0,0,0,0,0,0,0 +"AEM00041194","2022-08-01",384,427,357,0,0,0,0,0,0,0 +"AEM00041194","2022-08-02",381,424,352,0,0,0,0,0,0,0 +``` + +Using ClickHouse local and a simple `GROUP BY`, we can repivot our data to this structure. To limit memory overhead, we do this one file at a time. 
+ +```bash +for i in {1900..2022} +do +clickhouse-local --query "SELECT station_id, + toDate32(date) as date, + anyIf(value, measurement = 'TAVG') as tempAvg, + anyIf(value, measurement = 'TMAX') as tempMax, + anyIf(value, measurement = 'TMIN') as tempMin, + anyIf(value, measurement = 'PRCP') as precipitation, + anyIf(value, measurement = 'SNOW') as snowfall, + anyIf(value, measurement = 'SNWD') as snowDepth, + anyIf(value, measurement = 'PSUN') as percentDailySun, + anyIf(value, measurement = 'AWND') as averageWindSpeed, + anyIf(value, measurement = 'WSFG') as maxWindSpeed, + toUInt8OrZero(replaceOne(anyIf(measurement, startsWith(measurement, 'WT') AND value = 1), 'WT', '')) as weatherType +FROM file('$i.csv.gz', CSV, 'station_id String, date String, measurement String, value Int64, mFlag String, qFlag String, sFlag String, obsTime String') + WHERE qFlag = '' AND (measurement IN ('PRCP', 'SNOW', 'SNWD', 'TMAX', 'TAVG', 'TMIN', 'PSUN', 'AWND', 'WSFG') OR startsWith(measurement, 'WT')) +GROUP BY station_id, date +ORDER BY station_id, date FORMAT CSV" >> "noaa.csv"; +done +``` + +This query produces a single 50GB file `noaa.csv`. + +### Enriching the data + +The data has no indication of location aside from a station id, which includes a prefix country code. Ideally, each station would have a latitude and longitude associated with it. To achieve this, NOAA conveniently provides the details of each station as a separate [ghcnd-stations.txt](https://github.com/awslabs/open-data-docs/tree/main/docs/noaa/noaa-ghcn#format-of-ghcnd-stationstxt-file). This file has [several columns](https://github.com/awslabs/open-data-docs/tree/main/docs/noaa/noaa-ghcn#format-of-ghcnd-stationstxt-file), of which five are useful to our future analysis: id, latitude, longitude, elevation, and name. + +```bash +wget http://noaa-ghcn-pds.s3.amazonaws.com/ghcnd-stations.txt +``` + +```bash +clickhouse local --query "WITH stations AS (SELECT id, lat, lon, elevation, splitByString(' GSN ',name)[1] as name FROM file('ghcnd-stations.txt', Regexp, 'id String, lat Float64, lon Float64, elevation Float32, name String')) +SELECT station_id, + date, + tempAvg, + tempMax, + tempMin, + precipitation, + snowfall, + snowDepth, + percentDailySun, + averageWindSpeed, + maxWindSpeed, + weatherType, + tuple(lon, lat) as location, + elevation, + name +FROM file('noaa.csv', CSV, + 'station_id String, date Date32, tempAvg Int32, tempMax Int32, tempMin Int32, precipitation Int32, snowfall Int32, snowDepth Int32, percentDailySun Int8, averageWindSpeed Int32, maxWindSpeed Int32, weatherType UInt8') as noaa LEFT OUTER + JOIN stations ON noaa.station_id = stations.id INTO OUTFILE 'noaa_enriched.parquet' FORMAT Parquet SETTINGS format_regexp='^(.{11})\s+(\-?\d{1,2}\.\d{4})\s+(\-?\d{1,3}\.\d{1,4})\s+(\-?\d*\.\d*)\s+(.*)\s+(?:[\d]*)'" +``` +This query takes a few minutes to run and produces an 6.4GB file `noaa_enriched.parquet`. + +## Create table + +Create a MergeTree table in ClickHouse (from the ClickHouse client). 
+ +```sql +CREATE TABLE noaa +( + `station_id` LowCardinality(String), + `date` Date32, + `tempAvg` Int32 COMMENT 'Average temperature (tenths of a degrees C)', + `tempMax` Int32 COMMENT 'Maximum temperature (tenths of degrees C)', + `tempMin` Int32 COMMENT 'Minimum temperature (tenths of degrees C)', + `precipitation` UInt32 COMMENT 'Precipitation (tenths of mm)', + `snowfall` UInt32 COMMENT 'Snowfall (mm)', + `snowDepth` UInt32 COMMENT 'Snow depth (mm)', + `percentDailySun` UInt8 COMMENT 'Daily percent of possible sunshine (percent)', + `averageWindSpeed` UInt32 COMMENT 'Average daily wind speed (tenths of meters per second)', + `maxWindSpeed` UInt32 COMMENT 'Peak gust wind speed (tenths of meters per second)', + `weatherType` Enum8('Normal' = 0, 'Fog' = 1, 'Heavy Fog' = 2, 'Thunder' = 3, 'Small Hail' = 4, 'Hail' = 5, 'Glaze' = 6, 'Dust/Ash' = 7, 'Smoke/Haze' = 8, 'Blowing/Drifting Snow' = 9, 'Tornado' = 10, 'High Winds' = 11, 'Blowing Spray' = 12, 'Mist' = 13, 'Drizzle' = 14, 'Freezing Drizzle' = 15, 'Rain' = 16, 'Freezing Rain' = 17, 'Snow' = 18, 'Unknown Precipitation' = 19, 'Ground Fog' = 21, 'Freezing Fog' = 22), + `location` Point, + `elevation` Float32, + `name` LowCardinality(String) +) ENGINE = MergeTree() ORDER BY (station_id, date); + +``` + +## Inserting into ClickHouse + +### Inserting from local file + +Data can be inserted from a local file as follows (from the ClickHouse client): + +```sql +INSERT INTO noaa FROM INFILE '<path>/noaa_enriched.parquet' +``` + +where `<path>` represents the full path to the local file on disk. + +See [here](https://clickhouse.com/blog/real-world-data-noaa-climate-data#load-the-data) for how to speed this load up. + +### Inserting from S3 + +```sql +INSERT INTO noaa SELECT * +FROM s3('https://datasets-documentation.s3.eu-west-3.amazonaws.com/noaa/noaa_enriched.parquet') + +``` +For how to speed this up, see our blog post on [tuning large data loads](https://clickhouse.com/blog/supercharge-your-clickhouse-data-loads-part2). + +## Sample queries + +### Highest temperature ever + +```sql +SELECT + tempMax / 10 AS maxTemp, + location, + name, + date +FROM noaa +WHERE tempMax > 500 +ORDER BY + tempMax DESC, + date ASC +LIMIT 5 + +┌─maxTemp─┬─location──────────┬─name───────────────────────────────────────────┬───────date─┐ +│ 56.7 │ (-116.8667,36.45) │ CA GREENLAND RCH │ 1913-07-10 │ +│ 56.7 │ (-115.4667,32.55) │ MEXICALI (SMN) │ 1949-08-20 │ +│ 56.7 │ (-115.4667,32.55) │ MEXICALI (SMN) │ 1949-09-18 │ +│ 56.7 │ (-115.4667,32.55) │ MEXICALI (SMN) │ 1952-07-17 │ +│ 56.7 │ (-115.4667,32.55) │ MEXICALI (SMN) │ 1952-09-04 │ +└─────────┴───────────────────┴────────────────────────────────────────────────┴────────────┘ + +5 rows in set. Elapsed: 0.514 sec. Processed 1.06 billion rows, 4.27 GB (2.06 billion rows/s., 8.29 GB/s.) +``` + +Reassuringly consistent with the [documented record](https://en.wikipedia.org/wiki/List_of_weather_records#Highest_temperatures_ever_recorded) at [Furnace Creek](https://www.google.com/maps/place/36%C2%B027'00.0%22N+116%C2%B052'00.1%22W/@36.1329666,-116.1104099,8.95z/data=!4m5!3m4!1s0x0:0xf2ed901b860f4446!8m2!3d36.45!4d-116.8667) as of 2023. + +### Best ski resorts + +Using a [list of ski resorts](https://gist.githubusercontent.com/gingerwizard/dd022f754fd128fdaf270e58fa052e35/raw/622e03c37460f17ef72907afe554cb1c07f91f23/ski_resort_stats.csv) in the United States and their respective locations, we join these against the top 1000 weather stations with the most snow in any month in the last 5 yrs.
Sorting this join by [geoDistance](https://clickhouse.com/docs/en/sql-reference/functions/geo/coordinates/#geodistance) and restricting the results to those where the distance is less than 20km, we select the top result per resort and sort this by total snow. Note we also restrict resorts to those above 1800m, as a broad indicator of good skiing conditions. + +```sql +SELECT + resort_name, + total_snow / 1000 AS total_snow_m, + resort_location, + month_year +FROM +( + WITH resorts AS + ( + SELECT + resort_name, + state, + (lon, lat) AS resort_location, + 'US' AS code + FROM url('https://gist.githubusercontent.com/gingerwizard/dd022f754fd128fdaf270e58fa052e35/raw/622e03c37460f17ef72907afe554cb1c07f91f23/ski_resort_stats.csv', CSVWithNames) + ) + SELECT + resort_name, + highest_snow.station_id, + geoDistance(resort_location.1, resort_location.2, station_location.1, station_location.2) / 1000 AS distance_km, + highest_snow.total_snow, + resort_location, + station_location, + month_year + FROM + ( + SELECT + sum(snowfall) AS total_snow, + station_id, + any(location) AS station_location, + month_year, + substring(station_id, 1, 2) AS code + FROM noaa + WHERE (date > '2017-01-01') AND (code = 'US') AND (elevation > 1800) + GROUP BY + station_id, + toYYYYMM(date) AS month_year + ORDER BY total_snow DESC + LIMIT 1000 + ) AS highest_snow + INNER JOIN resorts ON highest_snow.code = resorts.code + WHERE distance_km < 20 + ORDER BY + resort_name ASC, + total_snow DESC + LIMIT 1 BY + resort_name, + station_id +) +ORDER BY total_snow DESC +LIMIT 5 + +┌─resort_name──────────┬─total_snow_m─┬─resort_location─┬─month_year─┐ +│ Sugar Bowl, CA │ 7.799 │ (-120.3,39.27) │ 201902 │ +│ Donner Ski Ranch, CA │ 7.799 │ (-120.34,39.31) │ 201902 │ +│ Boreal, CA │ 7.799 │ (-120.35,39.33) │ 201902 │ +│ Homewood, CA │ 4.926 │ (-120.17,39.08) │ 201902 │ +│ Alpine Meadows, CA │ 4.926 │ (-120.22,39.17) │ 201902 │ +└──────────────────────┴──────────────┴─────────────────┴────────────┘ + +5 rows in set. Elapsed: 0.750 sec. Processed 689.10 million rows, 3.20 GB (918.20 million rows/s., 4.26 GB/s.) +Peak memory usage: 67.66 MiB. +``` + +## Credits + +We would like to acknowledge the efforts of the Global Historical Climatology Network for preparing, cleansing, and distributing this data. We appreciate your efforts. + +Menne, M.J., I. Durre, B. Korzeniewski, S. McNeal, K. Thomas, X. Yin, S. Anthony, R. Ray, R.S. Vose, B.E.Gleason, and T.G. Houston, 2012: Global Historical Climatology Network - Daily (GHCN-Daily), Version 3. [indicate subset used following decimal, e.g. Version 3.25]. NOAA National Centers for Environmental Information. 
http://doi.org/10.7289/V5D21VHZ [17/08/2020] From ffde721f08359e0437c44026881e2514012a4966 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sat, 13 Jan 2024 23:09:10 +0300 Subject: [PATCH 0116/1081] Update 02932_set_ttl_where.sql --- tests/queries/0_stateless/02932_set_ttl_where.sql | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/tests/queries/0_stateless/02932_set_ttl_where.sql b/tests/queries/0_stateless/02932_set_ttl_where.sql index bf2b317c4bf..ee8473e1af2 100644 --- a/tests/queries/0_stateless/02932_set_ttl_where.sql +++ b/tests/queries/0_stateless/02932_set_ttl_where.sql @@ -1,3 +1,5 @@ +-- Tags: no-ordinary-database + create or replace table t_temp ( a UInt32, timestamp DateTime @@ -12,3 +14,5 @@ select sleep(1); insert into t_temp select rand(), now() from system.numbers limit 1_000_000; select sleep(1); optimize table t_temp final; + +DROP TABLE t_temp; From 12585ea0e4cae1771ee6b51dd85a309e5923f12c Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sat, 13 Jan 2024 23:10:27 +0300 Subject: [PATCH 0117/1081] Update TTLDescription.cpp --- src/Storages/TTLDescription.cpp | 25 ------------------------- 1 file changed, 25 deletions(-) diff --git a/src/Storages/TTLDescription.cpp b/src/Storages/TTLDescription.cpp index bfd3afc30d8..3db5269b617 100644 --- a/src/Storages/TTLDescription.cpp +++ b/src/Storages/TTLDescription.cpp @@ -117,11 +117,6 @@ TTLDescription::TTLDescription(const TTLDescription & other) , if_exists(other.if_exists) , recompression_codec(other.recompression_codec) { - // if (other.expression) - // expression = other.expression->clone(); - - // if (other.where_expression) - // where_expression = other.where_expression->clone(); } TTLDescription & TTLDescription::operator=(const TTLDescription & other) @@ -135,11 +130,6 @@ TTLDescription & TTLDescription::operator=(const TTLDescription & other) else expression_ast.reset(); - // if (other.expression) - // expression = other.expression->clone(); - // else - // expression.reset(); - expression_columns = other.expression_columns; result_column = other.result_column; @@ -148,11 +138,6 @@ TTLDescription & TTLDescription::operator=(const TTLDescription & other) else where_expression_ast.reset(); - // if (other.where_expression) - // where_expression = other.where_expression->clone(); - // else - // where_expression.reset(); - where_expression_columns = other.where_expression_columns; where_result_column = other.where_result_column; group_by_keys = other.group_by_keys; @@ -179,7 +164,6 @@ static ExpressionAndSets buildExpressionAndSets(ASTPtr & ast, const NamesAndType auto dag = analyzer.getActionsDAG(false); const auto * col = &dag->findInOutputs(ast->getColumnName()); - // std::cerr << "buildExpressionAndSets " << ttl_string << std::endl; if (col->result_name != ttl_string) col = &dag->addAlias(*col, ttl_string); @@ -189,10 +173,6 @@ static ExpressionAndSets buildExpressionAndSets(ASTPtr & ast, const NamesAndType result.expression = std::make_shared(dag, ExpressionActionsSettings::fromContext(context)); result.sets = analyzer.getPreparedSets(); - // std::cerr << "--------- buildExpressionAndSets\n"; - // std::cerr << result.expression->dumpActions() << std::endl; - // std::cerr << result.sets->getSubqueries().size() << std::endl; - return result; } @@ -232,8 +212,6 @@ TTLDescription TTLDescription::getTTLFromAST( auto expression = buildExpressionAndSets(ttl_ast, columns.getAllPhysical(), context).expression; result.expression_columns = expression->getRequiredColumnsWithTypes(); - // auto syntax_analyzer_result = 
TreeRewriter(context).analyze(ttl_ast, columns.getAllPhysical()); - // result.expression = ExpressionAnalyzer(ttl_ast, syntax_analyzer_result, context).getActions(false); result.result_column = expression->getSampleBlock().safeGetByPosition(0).name; ExpressionActionsPtr where_expression; @@ -256,9 +234,6 @@ TTLDescription TTLDescription::getTTLFromAST( { result.where_expression_ast = where_expr_ast->clone(); where_expression = buildExpressionAndSets(where_expr_ast, columns.getAllPhysical(), context).expression; - // auto where_syntax_result = TreeRewriter(context).analyze(where_expr_ast, columns.getAllPhysical()); - // result.where_expression = ExpressionAnalyzer(where_expr_ast, where_syntax_result, context).getActions(false); - result.where_expression_columns = where_expression->getRequiredColumnsWithTypes(); result.where_result_column = where_expression->getSampleBlock().safeGetByPosition(0).name; } From 776ea26ce71287735897b00c65b47d73e8d9811c Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 14 Jan 2024 02:45:51 +0300 Subject: [PATCH 0118/1081] Update PreparedSets.h --- src/Interpreters/PreparedSets.h | 1 - 1 file changed, 1 deletion(-) diff --git a/src/Interpreters/PreparedSets.h b/src/Interpreters/PreparedSets.h index 30bfda4700d..4f5ca337c5b 100644 --- a/src/Interpreters/PreparedSets.h +++ b/src/Interpreters/PreparedSets.h @@ -115,7 +115,6 @@ public: SetPtr buildSetInplace(const ContextPtr & context); std::unique_ptr build(const ContextPtr & context); - void buildSetInplace(const ContextPtr & context); QueryTreeNodePtr detachQueryTree() { return std::move(query_tree); } void setQueryPlan(std::unique_ptr source_); From 1afc5e8c01685d1bb3e86b5a0fff55618db517b0 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 14 Jan 2024 03:45:42 +0100 Subject: [PATCH 0119/1081] Enable coverage for debug build --- docker/packager/packager | 8 ++++++++ tests/ci/build_check.py | 2 ++ tests/ci/ci_config.py | 2 ++ 3 files changed, 12 insertions(+) diff --git a/docker/packager/packager b/docker/packager/packager index ade36a55591..4c443896f4a 100755 --- a/docker/packager/packager +++ b/docker/packager/packager @@ -121,6 +121,7 @@ def is_release_build(debug_build: bool, package_type: str, sanitizer: str) -> bo def parse_env_variables( debug_build: bool, + coverage: bool, compiler: str, sanitizer: str, package_type: str, @@ -287,6 +288,9 @@ def parse_env_variables( else: result.append("BUILD_TYPE=None") + if coverage: + result.append("SANITIZE_COVERAGE=1") + if not cache: cmake_flags.append("-DCOMPILER_CACHE=disabled") @@ -415,6 +419,9 @@ def parse_args() -> argparse.Namespace: choices=("address", "thread", "memory", "undefined", ""), default="", ) + parser.add_argument( + "--coverage", action="store_true", help="enable granular coverage with introspection" + ) parser.add_argument("--clang-tidy", action="store_true") parser.add_argument( @@ -507,6 +514,7 @@ def main() -> None: env_prepared = parse_env_variables( args.debug_build, + args.coverage, args.compiler, args.sanitizer, args.package_type, diff --git a/tests/ci/build_check.py b/tests/ci/build_check.py index 27243aac4f1..fe4308f5933 100644 --- a/tests/ci/build_check.py +++ b/tests/ci/build_check.py @@ -73,6 +73,8 @@ def get_packager_cmd( cmd += " --debug-build" if build_config.sanitizer: cmd += f" --sanitizer={build_config.sanitizer}" + if build_config.coverage: + cmd += " --coverage" if build_config.tidy: cmd += " --clang-tidy" diff --git a/tests/ci/ci_config.py b/tests/ci/ci_config.py index e3319fe4a72..b8dff3f0a28 100644 --- 
a/tests/ci/ci_config.py +++ b/tests/ci/ci_config.py @@ -62,6 +62,7 @@ class BuildConfig: package_type: Literal["deb", "binary", "fuzzers"] additional_pkgs: bool = False debug_build: bool = False + coverage: bool = False sanitizer: str = "" tidy: bool = False sparse_checkout: bool = False @@ -473,6 +474,7 @@ CI_CONFIG = CiConfig( name="package_debug", compiler="clang-17", debug_build=True, + coverage=True, package_type="deb", sparse_checkout=True, ), From 0219d58d925bd3f7901f9251c2abca76c1ae00dc Mon Sep 17 00:00:00 2001 From: robot-clickhouse Date: Sun, 14 Jan 2024 02:56:50 +0000 Subject: [PATCH 0120/1081] Automatic style fix --- docker/packager/packager | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/docker/packager/packager b/docker/packager/packager index 4c443896f4a..3e7f1ba447e 100755 --- a/docker/packager/packager +++ b/docker/packager/packager @@ -420,7 +420,9 @@ def parse_args() -> argparse.Namespace: default="", ) parser.add_argument( - "--coverage", action="store_true", help="enable granular coverage with introspection" + "--coverage", + action="store_true", + help="enable granular coverage with introspection", ) parser.add_argument("--clang-tidy", action="store_true") From 6405decbb0ad0e80fe20b22a9956481abbe3b479 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 14 Jan 2024 05:14:54 +0100 Subject: [PATCH 0121/1081] Fix Python --- docker/packager/packager | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docker/packager/packager b/docker/packager/packager index 4c443896f4a..2e2b6550636 100755 --- a/docker/packager/packager +++ b/docker/packager/packager @@ -289,7 +289,7 @@ def parse_env_variables( result.append("BUILD_TYPE=None") if coverage: - result.append("SANITIZE_COVERAGE=1") + cmake_flags.append("-DSANITIZE_COVERAGE=1") if not cache: cmake_flags.append("-DCOMPILER_CACHE=disabled") From 5ba6def57d0e256be75b729678fc37d4c8989f7e Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 14 Jan 2024 07:29:28 +0300 Subject: [PATCH 0122/1081] Update noaa.md --- .../getting-started/example-datasets/noaa.md | 32 ++++++++++--------- 1 file changed, 17 insertions(+), 15 deletions(-) diff --git a/docs/en/getting-started/example-datasets/noaa.md b/docs/en/getting-started/example-datasets/noaa.md index 8d34ff8d3ee..bc2e9fecae1 100644 --- a/docs/en/getting-started/example-datasets/noaa.md +++ b/docs/en/getting-started/example-datasets/noaa.md @@ -11,7 +11,7 @@ This dataset contains weather measurements for the last 120 years. Each row is a More precisely and according to the [origin of this data](https://github.com/awslabs/open-data-docs/tree/main/docs/noaa/noaa-ghcn): -> GHCN-Daily is a dataset that contains daily observations over global land areas. It contains station-based measurements from land-based stations worldwide, about two thirds of which are for precipitation measurements only (Menne et al., 2012). GHCN-Daily is a composite of climate records from numerous sources that were merged together and subjected to a common suite of quality assurance reviews (Durre et al., 2010). The archive includes the following meteorological elements: +> GHCN-Daily is a dataset that contains daily observations over global land areas. It contains station-based measurements from land-based stations worldwide, about two-thirds of which are for precipitation measurements only (Menne et al., 2012). 
GHCN-Daily is a composite of climate records from numerous sources that were merged together and subjected to a common suite of quality assurance reviews (Durre et al., 2010). The archive includes the following meteorological elements: - Daily maximum temperature - Daily minimum temperature @@ -28,7 +28,7 @@ More precisely and according to the [origin of this data](https://github.com/aws ### Pre-prepared data -More specifically, rows have been removed that did not fail any quality assurance checks by Noaa. The data has also been restructured from a measurement per line to a row per station id and date i.e. +More specifically, rows have been removed that did not fail any quality assurance checks by Noaa. The data has also been restructured from a measurement per line to a row per station id and date, i.e. ```csv "station_id","date","tempAvg","tempMax","tempMin","precipitation","snowfall","snowDepth","percentDailySun","averageWindSpeed","maxWindSpeed","weatherType" @@ -63,17 +63,19 @@ for i in {1900..2023}; do wget https://noaa-ghcn-pds.s3.amazonaws.com/csv.gz/${i #### Sampling the data ```bash -zcat 2021.csv.gz | head -AE000041196,20210101,TMAX,278,,,S, -AE000041196,20210101,PRCP,0,D,,S, -AE000041196,20210101,TAVG,214,H,,S, -AEM00041194,20210101,TMAX,266,,,S, -AEM00041194,20210101,TMIN,178,,,S, -AEM00041194,20210101,PRCP,0,,,S, -AEM00041194,20210101,TAVG,217,H,,S, -AEM00041217,20210101,TMAX,262,,,S, -AEM00041217,20210101,TMIN,155,,,S, -AEM00041217,20210101,TAVG,202,H,,S, +$ clickhouse-local --query "SELECT * FROM '2021.csv.gz' LIMIT 10" --format PrettyCompact +┌─c1──────────┬───────c2─┬─c3───┬──c4─┬─c5───┬─c6───┬─c7─┬───c8─┐ +│ AE000041196 │ 20210101 │ TMAX │ 278 │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ S │ ᴺᵁᴸᴸ │ +│ AE000041196 │ 20210101 │ PRCP │ 0 │ D │ ᴺᵁᴸᴸ │ S │ ᴺᵁᴸᴸ │ +│ AE000041196 │ 20210101 │ TAVG │ 214 │ H │ ᴺᵁᴸᴸ │ S │ ᴺᵁᴸᴸ │ +│ AEM00041194 │ 20210101 │ TMAX │ 266 │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ S │ ᴺᵁᴸᴸ │ +│ AEM00041194 │ 20210101 │ TMIN │ 178 │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ S │ ᴺᵁᴸᴸ │ +│ AEM00041194 │ 20210101 │ PRCP │ 0 │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ S │ ᴺᵁᴸᴸ │ +│ AEM00041194 │ 20210101 │ TAVG │ 217 │ H │ ᴺᵁᴸᴸ │ S │ ᴺᵁᴸᴸ │ +│ AEM00041217 │ 20210101 │ TMAX │ 262 │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ S │ ᴺᵁᴸᴸ │ +│ AEM00041217 │ 20210101 │ TMIN │ 155 │ ᴺᵁᴸᴸ │ ᴺᵁᴸᴸ │ S │ ᴺᵁᴸᴸ │ +│ AEM00041217 │ 20210101 │ TAVG │ 202 │ H │ ᴺᵁᴸᴸ │ S │ ᴺᵁᴸᴸ │ +└─────────────┴──────────┴──────┴─────┴──────┴──────┴────┴──────┘ ``` Summarizing the [format documentation](https://github.com/awslabs/open-data-docs/tree/main/docs/noaa/noaa-ghcn): @@ -88,7 +90,7 @@ Summarizing the format documentation and the columns in order: - SNOW - Snowfall (mm) - SNWD - Snow depth (mm) - TMAX - Maximum temperature (tenths of degrees C) - - TAVG - Average temperature (tenths of a degrees C) + - TAVG - Average temperature (tenths of a degree C) - TMIN - Minimum temperature (tenths of degrees C) - PSUN - Daily percent of possible sunshine (percent) - AWND - Average daily wind speed (tenths of meters per second) @@ -215,7 +217,7 @@ CREATE TABLE noaa ### Inserting from local file -Data can be inserted from local file as follows (from the ClickHouse client): +Data can be inserted from a local file as follows (from the ClickHouse client): ```sql INSERT INTO noaa FROM INFILE '/noaa_enriched.parquet' From 9f5a7c51175dc3d4cfe46065b4912e7973a30983 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 14 Jan 2024 08:05:57 +0100 Subject: [PATCH 0123/1081] Fix error --- cmake/sanitize.cmake | 1 + contrib/jemalloc-cmake/CMakeLists.txt | 3 +++ 2 files changed, 4 insertions(+) diff --git a/cmake/sanitize.cmake 
b/cmake/sanitize.cmake index 3f7a8498059..3882b51227e 100644 --- a/cmake/sanitize.cmake +++ b/cmake/sanitize.cmake @@ -82,3 +82,4 @@ if (SANITIZE_COVERAGE) endif() set (WITHOUT_COVERAGE_FLAGS "-fno-profile-instr-generate -fno-coverage-mapping -fno-sanitize-coverage=trace-pc-guard,pc-table") +set (WITHOUT_COVERAGE_FLAGS_LIST -fno-profile-instr-generate -fno-coverage-mapping -fno-sanitize-coverage=trace-pc-guard,pc-table) diff --git a/contrib/jemalloc-cmake/CMakeLists.txt b/contrib/jemalloc-cmake/CMakeLists.txt index 15e965ed841..f85a38dcf8a 100644 --- a/contrib/jemalloc-cmake/CMakeLists.txt +++ b/contrib/jemalloc-cmake/CMakeLists.txt @@ -161,6 +161,9 @@ target_include_directories(_jemalloc SYSTEM PRIVATE target_compile_definitions(_jemalloc PRIVATE -DJEMALLOC_NO_PRIVATE_NAMESPACE) +# Because our coverage callbacks call malloc, and recursive call of malloc could not work. +target_compile_options(_jemalloc PRIVATE ${WITHOUT_COVERAGE_FLAGS_LIST}) + if (CMAKE_BUILD_TYPE_UC STREQUAL "DEBUG") target_compile_definitions(_jemalloc PRIVATE -DJEMALLOC_DEBUG=1 From 3d904cbf81eb6ce2472eabdcd0be5f6955984ce5 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 14 Jan 2024 08:09:08 +0100 Subject: [PATCH 0124/1081] Slightly better --- base/base/coverage.cpp | 13 +++++++++++-- 1 file changed, 11 insertions(+), 2 deletions(-) diff --git a/base/base/coverage.cpp b/base/base/coverage.cpp index d70c3bcd82b..ac8055e836c 100644 --- a/base/base/coverage.cpp +++ b/base/base/coverage.cpp @@ -1,4 +1,5 @@ #include "coverage.h" +#include #pragma GCC diagnostic ignored "-Wreserved-identifier" @@ -57,6 +58,14 @@ namespace uintptr_t * all_addresses_array = nullptr; size_t all_addresses_array_size = 0; + + uintptr_t * allocate(size_t size) + { + void * map = mmap(nullptr, size, PROT_READ | PROT_WRITE, MAP_PRIVATE | MAP_ANONYMOUS, -1, 0); + if (MAP_FAILED == map) + return nullptr; + return static_cast(map); + } } extern "C" @@ -79,7 +88,7 @@ void __sanitizer_cov_trace_pc_guard_init(uint32_t * start, uint32_t * stop) coverage_array_size = stop - start; /// Note: we will leak this. 
- coverage_array = static_cast(malloc(sizeof(uintptr_t) * coverage_array_size)); + coverage_array = allocate(sizeof(uintptr_t) * coverage_array_size); resetCoverage(); } @@ -92,7 +101,7 @@ void __sanitizer_cov_pcs_init(const uintptr_t * pcs_begin, const uintptr_t * pcs return; pc_table_initialized = true; - all_addresses_array = static_cast(malloc(sizeof(uintptr_t) * coverage_array_size)); + all_addresses_array = allocate(sizeof(uintptr_t) * coverage_array_size); all_addresses_array_size = pcs_end - pcs_begin; /// They are not a real pointers, but also contain a flag in the most significant bit, From 33d9a1d4e83d58f15e36ea6e88908c8410f03c40 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 14 Jan 2024 22:03:47 +0100 Subject: [PATCH 0125/1081] Documentation --- src/Functions/coverage.cpp | 48 ++++++++++++++++++++++++++++++++++++-- 1 file changed, 46 insertions(+), 2 deletions(-) diff --git a/src/Functions/coverage.cpp b/src/Functions/coverage.cpp index 8a62469fa54..86de047a76b 100644 --- a/src/Functions/coverage.cpp +++ b/src/Functions/coverage.cpp @@ -85,8 +85,52 @@ public: REGISTER_FUNCTION(Coverage) { - factory.registerFunction("coverage", [](ContextPtr){ return std::make_unique(std::make_shared(Kind::Current)); }); - factory.registerFunction("coverageAll", [](ContextPtr){ return std::make_unique(std::make_shared(Kind::All)); }); + factory.registerFunction("coverage", [](ContextPtr){ return std::make_unique(std::make_shared(Kind::Current)); }, + FunctionDocumentation + { + .description=R"( +This function is only available if ClickHouse was built with the SANITIZE_COVERAGE=1 option. + +It returns an array of unique addresses (a subset of the instrumented points in code) in the code +encountered at runtime after the previous coverage reset (with the `SYSTEM RESET COVERAGE` query) or after server startup. + +[example:functions] + +The order of array elements is undetermined. + +You can use another function, `coverageAll` to find all instrumented addresses in the code to compare and calculate the percentage. + +You can process the addresses with the `addressToSymbol` (possibly with `demangle`) and `addressToLine` functions +to calculate symbol-level, file-level, or line-level coverage. + +If you run multiple tests sequentially and reset the coverage with the `SYSTEM RESET COVERAGE` query between the tests, +you can obtain a coverage information for every test in isolation, to find which functions are covered by which tests and vise-versa. + +By default, every *basic block* in the code is covered, which roughly means - a sequence of instructions without jumps, +e.g. a body of for loop without ifs, or a single branch of if. + +See https://clang.llvm.org/docs/SanitizerCoverage.html for more information. +)", + .examples{ + {"functions", "SELECT DISTINCT demangle(addressToSymbol(arrayJoin(coverage())))", ""}}, + .categories{"Introspection"} + }); + + factory.registerFunction("coverageAll", [](ContextPtr){ return std::make_unique(std::make_shared(Kind::All)); }, + FunctionDocumentation + { + .description=R"( +This function is only available if ClickHouse was built with the SANITIZE_COVERAGE=1 option. + +It returns an array of all unique addresses in the code instrumented for coverage +- all possible addresses that can appear in the result of the `coverage` function. + +You can use this function, and the `coverage` function to compare and calculate the coverage percentage. + +See the `coverage` function for the details. 
+)", + .categories{"Introspection"} + }); } } From 3bd2c7e384d07d07da8768aa4708c7726b828db5 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 14 Jan 2024 22:06:25 +0100 Subject: [PATCH 0126/1081] Report coverage if available --- tests/clickhouse-test | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/clickhouse-test b/tests/clickhouse-test index c7049b0e0c8..2d278f18176 100755 --- a/tests/clickhouse-test +++ b/tests/clickhouse-test @@ -2840,7 +2840,7 @@ def parse_args(): parser.add_argument( "--collect-per-test-coverage", action="store_true", - default=False, + default=True, help="Create `system.coverage` table on the server and collect information about low-level code coverage on a per test basis there", ) parser.add_argument( From 1c1e1512bf92c4788ce17f38cf228d4525cdb9eb Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 01:29:38 +0300 Subject: [PATCH 0127/1081] Update noaa.md --- docs/en/getting-started/example-datasets/noaa.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/en/getting-started/example-datasets/noaa.md b/docs/en/getting-started/example-datasets/noaa.md index bc2e9fecae1..9a3ec7791b6 100644 --- a/docs/en/getting-started/example-datasets/noaa.md +++ b/docs/en/getting-started/example-datasets/noaa.md @@ -185,7 +185,7 @@ FROM file('noaa.csv', CSV, 'station_id String, date Date32, tempAvg Int32, tempMax Int32, tempMin Int32, precipitation Int32, snowfall Int32, snowDepth Int32, percentDailySun Int8, averageWindSpeed Int32, maxWindSpeed Int32, weatherType UInt8') as noaa LEFT OUTER JOIN stations ON noaa.station_id = stations.id INTO OUTFILE 'noaa_enriched.parquet' FORMAT Parquet SETTINGS format_regexp='^(.{11})\s+(\-?\d{1,2}\.\d{4})\s+(\-?\d{1,3}\.\d{1,4})\s+(\-?\d*\.\d*)\s+(.*)\s+(?:[\d]*)'" ``` -This query takes a few minutes to run and produces an 6.4GB file `noaa_enriched.parquet`. +This query takes a few minutes to run and produces a 6.4 GB file, `noaa_enriched.parquet`. ## Create table From 9141e1693f03f39d2eda37423918d2b2d873877a Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 00:24:17 +0100 Subject: [PATCH 0128/1081] Calculate cumulative coverage by default. --- tests/clickhouse-test | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/tests/clickhouse-test b/tests/clickhouse-test index 2d278f18176..f1b20a3a43e 100755 --- a/tests/clickhouse-test +++ b/tests/clickhouse-test @@ -1322,6 +1322,7 @@ class TestCase: # We want to calculate per-test code coverage. That's why we reset it before each test. if ( args.collect_per_test_coverage + and args.reset_coverage_before_every_test and BuildFlags.SANITIZE_COVERAGE in args.build_flags ): clickhouse_execute( @@ -2843,6 +2844,12 @@ def parse_args(): default=True, help="Create `system.coverage` table on the server and collect information about low-level code coverage on a per test basis there", ) + parser.add_argument( + "--reset-coverage-before-every-test", + action="store_true", + default=False, + help="Collect isolated test coverage for every test instead of a cumulative. 
Useful only when tests are run sequentially.", + ) parser.add_argument( "--report-logs-stats", action="store_true", From f7abeff0857ec231a7107d2a006b5f98b60a689f Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 00:25:07 +0100 Subject: [PATCH 0129/1081] Slightly better reporting --- tests/clickhouse-test | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/clickhouse-test b/tests/clickhouse-test index f1b20a3a43e..e480957e5f4 100755 --- a/tests/clickhouse-test +++ b/tests/clickhouse-test @@ -1259,7 +1259,7 @@ class TestCase: retry_error_codes=True, ).decode() - description_full += f" Coverage: {coverage}" + description_full += f" (coverage: {coverage})" description_full += "\n" From 3e09feda336a355173b46ec85a9cd86d640f3348 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 00:36:07 +0100 Subject: [PATCH 0130/1081] More functions --- base/base/coverage.cpp | 21 +++++++++++++++------ base/base/coverage.h | 5 ++++- src/Functions/coverage.cpp | 33 ++++++++++++++++++++++++++++----- tests/clickhouse-test | 6 +++--- 4 files changed, 50 insertions(+), 15 deletions(-) diff --git a/base/base/coverage.cpp b/base/base/coverage.cpp index ac8055e836c..499e384d21f 100644 --- a/base/base/coverage.cpp +++ b/base/base/coverage.cpp @@ -53,7 +53,8 @@ namespace uint32_t * guards_start = nullptr; uint32_t * guards_end = nullptr; - uintptr_t * coverage_array = nullptr; + uintptr_t * current_coverage_array = nullptr; + uintptr_t * cumulative_coverage_array = nullptr; size_t coverage_array_size = 0; uintptr_t * all_addresses_array = nullptr; @@ -88,7 +89,8 @@ void __sanitizer_cov_trace_pc_guard_init(uint32_t * start, uint32_t * stop) coverage_array_size = stop - start; /// Note: we will leak this. - coverage_array = allocate(sizeof(uintptr_t) * coverage_array_size); + current_coverage_array = allocate(sizeof(uintptr_t) * coverage_array_size); + cumulative_coverage_array = allocate(sizeof(uintptr_t) * coverage_array_size); resetCoverage(); } @@ -126,15 +128,22 @@ void __sanitizer_cov_trace_pc_guard(uint32_t * guard) /// and use them to dereference an array or a bit vector. void * pc = __builtin_return_address(0); - coverage_array[guard - guards_start] = reinterpret_cast(pc); + current_coverage_array[guard - guards_start] = reinterpret_cast(pc); + cumulative_coverage_array[guard - guards_start] = reinterpret_cast(pc); } } __attribute__((no_sanitize("coverage"))) -std::span getCoverage() +std::span getCurrentCoverage() { - return {coverage_array, coverage_array_size}; + return {current_coverage_array, coverage_array_size}; +} + +__attribute__((no_sanitize("coverage"))) +std::span getCumulativeCoverage() +{ + return {cumulative_coverage_array, coverage_array_size}; } __attribute__((no_sanitize("coverage"))) @@ -146,7 +155,7 @@ std::span getAllInstrumentedAddresses() __attribute__((no_sanitize("coverage"))) void resetCoverage() { - memset(coverage_array, 0, coverage_array_size * sizeof(*coverage_array)); + memset(current_coverage_array, 0, coverage_array_size * sizeof(*current_coverage_array)); /// The guard defines whether the __sanitizer_cov_trace_pc_guard should be called. /// For example, you can unset it after first invocation to prevent excessive work. 
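For reference, with the split into a current and a cumulative array, all three views become queryable through the SQL functions registered in src/Functions/coverage.cpp further down in this patch. A minimal sketch of inspecting them from a client, assuming a binary built with -DSANITIZE_COVERAGE=1 (the symbolization query additionally requires introspection functions to be allowed):

```sql
-- Instrumented points hit since the last `SYSTEM RESET COVERAGE`, since startup,
-- and the total number of instrumented points in this binary.
SELECT
    length(coverageCurrent())    AS hit_since_reset,
    length(coverageCumulative()) AS hit_since_startup,
    length(coverageAll())        AS instrumented_total;

-- Symbolize the currently covered addresses.
SELECT DISTINCT demangle(addressToSymbol(arrayJoin(coverageCurrent()))) AS covered_symbol
SETTINGS allow_introspection_functions = 1;
```
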
diff --git a/base/base/coverage.h b/base/base/coverage.h index f75ed2d3553..a6e5a6848d7 100644 --- a/base/base/coverage.h +++ b/base/base/coverage.h @@ -15,7 +15,10 @@ void dumpCoverageReportIfPossible(); /// Get accumulated unique program addresses of the instrumented parts of the code, /// seen so far after program startup or after previous reset. /// The returned span will be represented as a sparse map, containing mostly zeros, which you should filter away. -std::span getCoverage(); +std::span getCurrentCoverage(); + +/// Similar but not being reset. +std::span getCumulativeCoverage(); /// Get all instrumented addresses that could be in the coverage. std::span getAllInstrumentedAddresses(); diff --git a/src/Functions/coverage.cpp b/src/Functions/coverage.cpp index 86de047a76b..f4cac26df78 100644 --- a/src/Functions/coverage.cpp +++ b/src/Functions/coverage.cpp @@ -21,11 +21,14 @@ namespace enum class Kind { Current, + Cumulative, All }; /** If ClickHouse is build with coverage instrumentation, returns an array - * of currently accumulated (`coverage`) / all possible (`coverageAll`) unique code addresses. + * of currently accumulated (`coverageCurrent`) + * or accumulated since the startup (`coverageCumulative`) + * or all possible (`coverageAll`) unique code addresses. */ class FunctionCoverage : public IFunction { @@ -64,7 +67,11 @@ public: ColumnPtr executeImpl(const ColumnsWithTypeAndName &, const DataTypePtr &, size_t input_rows_count) const override { - auto coverage_table = kind == Kind::Current ? getCoverage() : getAllInstrumentedAddresses(); + auto coverage_table = kind == Kind::Current + ? getCurrentCoverage() + : (kind == Kind::Cumulative + ? getCumulativeCoverage() + : getAllInstrumentedAddresses()); auto column_addresses = ColumnUInt64::create(); auto & data = column_addresses->getData(); @@ -85,7 +92,7 @@ public: REGISTER_FUNCTION(Coverage) { - factory.registerFunction("coverage", [](ContextPtr){ return std::make_unique(std::make_shared(Kind::Current)); }, + factory.registerFunction("coverageCurrent", [](ContextPtr){ return std::make_unique(std::make_shared(Kind::Current)); }, FunctionDocumentation { .description=R"( @@ -112,7 +119,23 @@ e.g. a body of for loop without ifs, or a single branch of if. See https://clang.llvm.org/docs/SanitizerCoverage.html for more information. )", .examples{ - {"functions", "SELECT DISTINCT demangle(addressToSymbol(arrayJoin(coverage())))", ""}}, + {"functions", "SELECT DISTINCT demangle(addressToSymbol(arrayJoin(coverageCurrent())))", ""}}, + .categories{"Introspection"} + }); + + factory.registerFunction("coverageCumulative", [](ContextPtr){ return std::make_unique(std::make_shared(Kind::Cumulative)); }, + FunctionDocumentation + { + .description=R"( +This function is only available if ClickHouse was built with the SANITIZE_COVERAGE=1 option. + +It returns an array of unique addresses (a subset of the instrumented points in code) in the code +encountered at runtime after server startup. + +In contrast to `coverageCurrent` it cannot be reset with the `SYSTEM RESET COVERAGE`. + +See the `coverageCurrent` function for the details. +)", .categories{"Introspection"} }); @@ -127,7 +150,7 @@ It returns an array of all unique addresses in the code instrumented for coverag You can use this function, and the `coverage` function to compare and calculate the coverage percentage. -See the `coverage` function for the details. +See the `coverageCurrent` function for the details. 
)", .categories{"Introspection"} }); diff --git a/tests/clickhouse-test b/tests/clickhouse-test index e480957e5f4..a39c90947ba 100755 --- a/tests/clickhouse-test +++ b/tests/clickhouse-test @@ -1249,13 +1249,13 @@ class TestCase: ): clickhouse_execute( args, - f"INSERT INTO system.coverage SELECT now(), '{self.case}', coverage()", + f"INSERT INTO system.coverage SELECT now(), '{self.case}', coverageCurrent()", retry_error_codes=True, ) coverage = clickhouse_execute( args, - "SELECT length(coverage())", + "SELECT length(coverageCurrent())", retry_error_codes=True, ).decode() @@ -2460,7 +2460,7 @@ def main(args): # Coverage collected at the system startup before running any tests: clickhouse_execute( args, - "INSERT INTO system.coverage SELECT now(), '', coverage()", + "INSERT INTO system.coverage SELECT now(), '', coverageCurrent()", ) total_tests_run = 0 From e4cd02ea39642dd9b8d519aee0426b752423c3bf Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 00:36:24 +0100 Subject: [PATCH 0131/1081] Fix typo --- src/IO/OpenedFile.h | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/src/IO/OpenedFile.h b/src/IO/OpenedFile.h index 10c36d9e1d3..4c4de2265bc 100644 --- a/src/IO/OpenedFile.h +++ b/src/IO/OpenedFile.h @@ -21,7 +21,7 @@ public: OpenedFile(const std::string & file_name_, int flags_); ~OpenedFile(); - /// Close prematurally. + /// Close prematurely. void close(); int getFD() const; @@ -40,4 +40,3 @@ private: }; } - From 30c362909089d6f7fe93b639dfdf1666d5bcfc7c Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 00:36:44 +0100 Subject: [PATCH 0132/1081] An option to dump coverage to a file at exit --- programs/main.cpp | 47 ++++++++++++++++++++++++++++++++++++++++++++++- 1 file changed, 46 insertions(+), 1 deletion(-) diff --git a/programs/main.cpp b/programs/main.cpp index 7d07112de66..4852ed8990e 100644 --- a/programs/main.cpp +++ b/programs/main.cpp @@ -1,6 +1,7 @@ #include #include #include +#include #include #include @@ -19,6 +20,7 @@ #include #include +#include /// Universal executable for various clickhouse applications @@ -512,6 +514,49 @@ int main(int argc_, char ** argv_) if (main_func == printHelp && !argv.empty() && (argv.size() == 1 || argv[1][0] == '-')) main_func = mainEntryClickHouseLocal; - return main_func(static_cast(argv.size()), argv.data()); + int exit_code = main_func(static_cast(argv.size()), argv.data()); + +#if defined(SANITIZE_COVERAGE) + /// A user can request to dump the coverage information into files at exit. + /// This is useful for non-server applications such as clickhouse-format or clickhouse-client, + /// that cannot introspect it with SQL functions at runtime. + + /// The CLICKHOUSE_WRITE_COVERAGE environment variable defines a prefix for two filenames: + /// 'prefix.covered' and 'prefix.all' which will contain + /// the list of addresses of covered and all instrumented addresses, respectively. + + /// The format is even simpler than Clang's "sancov": an array of 64-bit addresses, native byte order, no header. + + if (const char * coverage_filename_prefix = getenv("CLICKHOUSE_WRITE_COVERAGE")) // NOLINT(concurrency-mt-unsafe) + { + auto dumpCoverage = [](const std::string & name, auto span) + { + /// Write only non-zeros. 
+ std::vector data; + data.reserve(span.size()); + for (auto addr : span) + if (addr) + data.push_back(addr); + + int fd = ::open(name.c_str(), O_WRONLY | O_CREAT | O_TRUNC | O_CLOEXEC, 0400); + if (-1 == fd) + { + writeError("Cannot open a file to write the coverage data\n"); + } + else + { + if (!writeRetry(fd, reinterpret_cast(data.data()), data.size() * sizeof(data[0]))) + writeError("Cannot write the coverage data to a file\n"); + if (0 != ::close(fd)) + writeError("Cannot close the file with coverage data\n"); + } + }; + + dumpCoverage(coverage_filename_prefix + std::string(".covered"), getCumulativeCoverage()); + dumpCoverage(coverage_filename_prefix + std::string(".all"), getAllInstrumentedAddresses()); + } +#endif + + return exit_code; } #endif From fe952fb64c460c260c77336142b5eb4bd05b46d8 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 00:38:42 +0100 Subject: [PATCH 0133/1081] Rename to system.coverage_log to simplify export --- tests/clickhouse-test | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/tests/clickhouse-test b/tests/clickhouse-test index a39c90947ba..eb85bdff0f5 100755 --- a/tests/clickhouse-test +++ b/tests/clickhouse-test @@ -1249,7 +1249,7 @@ class TestCase: ): clickhouse_execute( args, - f"INSERT INTO system.coverage SELECT now(), '{self.case}', coverageCurrent()", + f"INSERT INTO system.coverage_log SELECT now(), '{self.case}', coverageCurrent()", retry_error_codes=True, ) @@ -2448,7 +2448,7 @@ def main(args): clickhouse_execute( args, """ - CREATE TABLE IF NOT EXISTS system.coverage + CREATE TABLE IF NOT EXISTS system.coverage_log ( time DateTime, test_name String, @@ -2460,7 +2460,7 @@ def main(args): # Coverage collected at the system startup before running any tests: clickhouse_execute( args, - "INSERT INTO system.coverage SELECT now(), '', coverageCurrent()", + "INSERT INTO system.coverage_log SELECT now(), '', coverageCurrent()", ) total_tests_run = 0 @@ -2842,7 +2842,7 @@ def parse_args(): "--collect-per-test-coverage", action="store_true", default=True, - help="Create `system.coverage` table on the server and collect information about low-level code coverage on a per test basis there", + help="Create `system.coverage_log` table on the server and collect information about low-level code coverage on a per test basis there", ) parser.add_argument( "--reset-coverage-before-every-test", From 7662628393f97dd1c094b3346cc55c71f10ad193 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 00:41:14 +0100 Subject: [PATCH 0134/1081] Export coverage to the CI database --- docker/test/base/setup_export_logs.sh | 13 +++++++++++++ 1 file changed, 13 insertions(+) diff --git a/docker/test/base/setup_export_logs.sh b/docker/test/base/setup_export_logs.sh index ea82e071112..659bf29b057 100755 --- a/docker/test/base/setup_export_logs.sh +++ b/docker/test/base/setup_export_logs.sh @@ -129,6 +129,19 @@ function setup_logs_replication debug_or_sanitizer_build=$(clickhouse-client -q "WITH ((SELECT value FROM system.build_options WHERE name='BUILD_TYPE') AS build, (SELECT value FROM system.build_options WHERE name='CXX_FLAGS') as flags) SELECT build='Debug' OR flags LIKE '%fsanitize%'") echo "Build is debug or sanitizer: $debug_or_sanitizer_build" + # We will pre-create a table system.coverage_log. 
+ # It is normally created by clickhouse-test rather than the server, + # so we will create it in advance to make it be picked up by the next commands: + + clickhouse-client --query " + CREATE TABLE IF NOT EXISTS system.coverage_log + ( + time DateTime, + test_name String, + coverage Array(UInt64) + ) ENGINE = MergeTree ORDER BY test_name + " + # For each system log table: echo 'Create %_log tables' clickhouse-client --query "SHOW TABLES FROM system LIKE '%\\_log'" | while read -r table From 97200e2c5d65693ad5d1e6a7c7dea3d5cac0e23d Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 00:46:01 +0100 Subject: [PATCH 0135/1081] Symbolization --- docker/test/base/setup_export_logs.sh | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/docker/test/base/setup_export_logs.sh b/docker/test/base/setup_export_logs.sh index 659bf29b057..e141bc00a77 100755 --- a/docker/test/base/setup_export_logs.sh +++ b/docker/test/base/setup_export_logs.sh @@ -138,7 +138,8 @@ function setup_logs_replication ( time DateTime, test_name String, - coverage Array(UInt64) + coverage Array(UInt64), + symbols Array(LowCardinality(String)) MATERIALIZED arrayMap(x -> demangle(addressToSymbol(x)), coverage) ) ENGINE = MergeTree ORDER BY test_name " From bf2e5748575ad2eb74eb057e0ee242a149edecdb Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 00:48:47 +0100 Subject: [PATCH 0136/1081] Symbolization --- docker/test/base/setup_export_logs.sh | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/docker/test/base/setup_export_logs.sh b/docker/test/base/setup_export_logs.sh index e141bc00a77..20dd864318f 100755 --- a/docker/test/base/setup_export_logs.sh +++ b/docker/test/base/setup_export_logs.sh @@ -188,7 +188,7 @@ function setup_logs_replication echo "Creating table system.${table}_sender" >&2 # Create Distributed table and materialized view to watch on the original table: - clickhouse-client --query " + clickhouse-client --asterisk_include_materialized_columns 1 --query " CREATE TABLE system.${table}_sender ENGINE = Distributed(${CLICKHOUSE_CI_LOGS_CLUSTER}, default, ${table}_${hash}) SETTINGS flush_on_detach=0 @@ -199,7 +199,7 @@ function setup_logs_replication echo "Creating materialized view system.${table}_watcher" >&2 - clickhouse-client --query " + clickhouse-client --asterisk_include_materialized_columns 1 --query " CREATE MATERIALIZED VIEW system.${table}_watcher TO system.${table}_sender AS SELECT ${EXTRA_COLUMNS_EXPRESSION_FOR_TABLE}, * FROM system.${table} From c5dfae1bcade85289b78f0bb760c92bcee078743 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 05:07:23 +0100 Subject: [PATCH 0137/1081] Fix error --- docker/test/base/setup_export_logs.sh | 12 +++++++++--- 1 file changed, 9 insertions(+), 3 deletions(-) diff --git a/docker/test/base/setup_export_logs.sh b/docker/test/base/setup_export_logs.sh index 20dd864318f..26fcd10d666 100755 --- a/docker/test/base/setup_export_logs.sh +++ b/docker/test/base/setup_export_logs.sh @@ -23,6 +23,10 @@ EXTRA_ORDER_BY_COLUMNS=${EXTRA_ORDER_BY_COLUMNS:-"check_name, "} EXTRA_COLUMNS_TRACE_LOG="${EXTRA_COLUMNS} symbols Array(LowCardinality(String)), lines Array(LowCardinality(String)), " EXTRA_COLUMNS_EXPRESSION_TRACE_LOG="${EXTRA_COLUMNS_EXPRESSION}, arrayMap(x -> demangle(addressToSymbol(x)), trace)::Array(LowCardinality(String)) AS symbols, arrayMap(x -> addressToLine(x), trace)::Array(LowCardinality(String)) AS lines" +# coverage_log needs more columns for symbolization, but only symbol 
names (the line numbers are too heavy to calculate) +EXTRA_COLUMNS_COVERAGE_LOG="${EXTRA_COLUMNS} symbols Array(LowCardinality(String)), " +EXTRA_COLUMNS_EXPRESSION_COVERAGE_LOG="${EXTRA_COLUMNS_EXPRESSION}, arrayMap(x -> demangle(addressToSymbol(x)), coverage)::Array(LowCardinality(String)) AS symbols" + function __set_connection_args { @@ -138,8 +142,7 @@ function setup_logs_replication ( time DateTime, test_name String, - coverage Array(UInt64), - symbols Array(LowCardinality(String)) MATERIALIZED arrayMap(x -> demangle(addressToSymbol(x)), coverage) + coverage Array(UInt64) ) ENGINE = MergeTree ORDER BY test_name " @@ -158,7 +161,10 @@ function setup_logs_replication else EXTRA_COLUMNS_EXPRESSION_FOR_TABLE="${EXTRA_COLUMNS_EXPRESSION_TRACE_LOG}" fi - else + elif [[ "$table" = "coverage_log" ]] + EXTRA_COLUMNS_FOR_TABLE="${EXTRA_COLUMNS_COVERAGE_LOG}" + EXTRA_COLUMNS_EXPRESSION_FOR_TABLE="${EXTRA_COLUMNS_EXPRESSION_COVERAGE_LOG}" + then EXTRA_COLUMNS_FOR_TABLE="${EXTRA_COLUMNS}" EXTRA_COLUMNS_EXPRESSION_FOR_TABLE="${EXTRA_COLUMNS_EXPRESSION}" fi From e13ca48bce836a2534047e59a4e922395a8f6a87 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 05:13:43 +0100 Subject: [PATCH 0138/1081] Better dump on exit --- programs/main.cpp | 8 +++----- 1 file changed, 3 insertions(+), 5 deletions(-) diff --git a/programs/main.cpp b/programs/main.cpp index 4852ed8990e..8958d84e243 100644 --- a/programs/main.cpp +++ b/programs/main.cpp @@ -521,9 +521,8 @@ int main(int argc_, char ** argv_) /// This is useful for non-server applications such as clickhouse-format or clickhouse-client, /// that cannot introspect it with SQL functions at runtime. - /// The CLICKHOUSE_WRITE_COVERAGE environment variable defines a prefix for two filenames: - /// 'prefix.covered' and 'prefix.all' which will contain - /// the list of addresses of covered and all instrumented addresses, respectively. + /// The CLICKHOUSE_WRITE_COVERAGE environment variable defines a prefix for a filename 'prefix.pid' + /// containing the list of addresses of covered . /// The format is even simpler than Clang's "sancov": an array of 64-bit addresses, native byte order, no header. 
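Because the dump is nothing more than consecutive native-endian 64-bit addresses with no header, it can be loaded back for analysis with the `file()` table function and the `RowBinary` format, mirroring what `clickhouse-test` does with `input()` in the next patch. A sketch under the assumption that a dump named `coverage.12345` (a hypothetical PID suffix) was copied into the server's `user_files` directory and that the same build of the binary is used for symbolization:

```sql
-- Addresses are only meaningful for the build that produced them.
SELECT DISTINCT demangle(addressToSymbol(addr)) AS covered_symbol
FROM file('coverage.12345', 'RowBinary', 'addr UInt64')
LIMIT 20
SETTINGS allow_introspection_functions = 1;
```
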
@@ -552,8 +551,7 @@ int main(int argc_, char ** argv_) } }; - dumpCoverage(coverage_filename_prefix + std::string(".covered"), getCumulativeCoverage()); - dumpCoverage(coverage_filename_prefix + std::string(".all"), getAllInstrumentedAddresses()); + dumpCoverage(fmt::format("{}.{}", coverage_filename_prefix, getpid()), getCumulativeCoverage()); } #endif From e49cfbef089499a457c8793724629e2e94c8dc37 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 05:40:03 +0100 Subject: [PATCH 0139/1081] Coverage for non-server tools --- tests/clickhouse-test | 23 +++++++++++++++++++++++ tests/queries/shell_config.sh | 4 ++++ 2 files changed, 27 insertions(+) diff --git a/tests/clickhouse-test b/tests/clickhouse-test index eb85bdff0f5..bd796dbfdf2 100755 --- a/tests/clickhouse-test +++ b/tests/clickhouse-test @@ -12,6 +12,7 @@ import itertools import sys import os import os.path +import glob import platform import signal import re @@ -74,6 +75,10 @@ def stringhash(s): # only during process invocation https://stackoverflow.com/a/42089311 return zlib.crc32(s.encode("utf-8")) +def read_file_as_binary_string(file_path): + with open(file_path, 'rb') as file: + binary_data = file.read() + return binary_data # First and last lines of the log def trim_for_log(s): @@ -101,6 +106,7 @@ class HTTPError(Exception): def clickhouse_execute_http( base_args, query, + body=None, timeout=30, settings=None, default_format=None, @@ -140,6 +146,7 @@ def clickhouse_execute_http( client.request( "POST", f"/?{base_args.client_options_query_str}{urllib.parse.urlencode(params)}", + body=body ) res = client.getresponse() data = res.read() @@ -160,6 +167,7 @@ def clickhouse_execute_http( def clickhouse_execute( base_args, query, + body=None, timeout=30, settings=None, max_http_retries=5, @@ -168,6 +176,7 @@ def clickhouse_execute( return clickhouse_execute_http( base_args, query, + body, timeout, settings, max_http_retries=max_http_retries, @@ -181,6 +190,7 @@ def clickhouse_execute_json( data = clickhouse_execute_http( base_args, query, + None, timeout, settings, "JSONEachRow", @@ -1253,6 +1263,19 @@ class TestCase: retry_error_codes=True, ) + # Check for dumped coverage files + file_pattern = "coverage.*" + matching_files = glob.glob(file_pattern) + for file_path in matching_files: + body = read_file_as_binary_string(file_path) + clickhouse_execute( + args, + f"INSERT INTO system.coverage_log SELECT now(), '{self.case}', groupArray(data) FROM input('data UInt64') FORMAT RowBinary", + body=body, + retry_error_codes=True, + ) + os.remove(file_path) + coverage = clickhouse_execute( args, "SELECT length(coverageCurrent())", diff --git a/tests/queries/shell_config.sh b/tests/queries/shell_config.sh index c687a63623f..614bfcece8f 100644 --- a/tests/queries/shell_config.sh +++ b/tests/queries/shell_config.sh @@ -4,6 +4,10 @@ # Don't check for ODR violation, since we may test shared build with ASAN export ASAN_OPTIONS=detect_odr_violation=0 +# If ClickHouse was built with coverage - dump the coverage information at exit +# (in other cases this environment variable has no effect) +export CLICKHOUSE_WRITE_COVERAGE="coverage" + export CLICKHOUSE_DATABASE=${CLICKHOUSE_DATABASE:="test"} export CLICKHOUSE_CLIENT_SERVER_LOGS_LEVEL=${CLICKHOUSE_CLIENT_SERVER_LOGS_LEVEL:="warning"} From 678a32cedee768b6c1a6748e96a0d103e853d8bc Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 06:12:58 +0100 Subject: [PATCH 0140/1081] Obey Python's quirky formatter --- tests/integration/ci-runner.py | 13 +- 
.../test_async_insert_memory/test.py | 2 +- tests/integration/test_check_table/test.py | 76 +++-- .../test_cluster_discovery/test.py | 2 +- .../test_ldap_external_user_directory/test.py | 26 +- tests/integration/test_mysql_protocol/test.py | 16 +- tests/integration/test_partition/test.py | 4 +- .../test_replicated_database/test.py | 9 +- .../test.py | 9 +- .../s3_mocks/unstable_server.py | 2 +- tests/integration/test_storage_s3/test.py | 17 +- tests/integration/test_storage_url/test.py | 22 +- tests/integration/test_system_merges/test.py | 45 ++- utils/grpc-client/pb2/clickhouse_grpc_pb2.py | 271 ++++++++++-------- .../pb2/clickhouse_grpc_pb2_grpc.py | 237 +++++++++------ 15 files changed, 433 insertions(+), 318 deletions(-) diff --git a/tests/integration/ci-runner.py b/tests/integration/ci-runner.py index 7c922e339fe..d54ed2bb767 100755 --- a/tests/integration/ci-runner.py +++ b/tests/integration/ci-runner.py @@ -305,14 +305,11 @@ class ClickhouseIntegrationTestsRunner: def _pre_pull_images(self, repo_path): image_cmd = self._get_runner_image_cmd(repo_path) - cmd = ( - "cd {repo_path}/tests/integration && " - "timeout --signal=KILL 1h ./runner {runner_opts} {image_cmd} --pre-pull --command '{command}' ".format( - repo_path=repo_path, - runner_opts=self._get_runner_opts(), - image_cmd=image_cmd, - command=r""" echo Pre Pull finished """, - ) + cmd = "cd {repo_path}/tests/integration && " "timeout --signal=KILL 1h ./runner {runner_opts} {image_cmd} --pre-pull --command '{command}' ".format( + repo_path=repo_path, + runner_opts=self._get_runner_opts(), + image_cmd=image_cmd, + command=r""" echo Pre Pull finished """, ) for i in range(5): diff --git a/tests/integration/test_async_insert_memory/test.py b/tests/integration/test_async_insert_memory/test.py index 5d2e5503680..f897007f7bb 100644 --- a/tests/integration/test_async_insert_memory/test.py +++ b/tests/integration/test_async_insert_memory/test.py @@ -43,7 +43,7 @@ def test_memory_usage(): response = node.get_query_request( "SELECT groupArray(number) FROM numbers(1000000) SETTINGS max_memory_usage_for_user={}".format( - 30 * (2**23) + 30 * (2 ** 23) ), user="A", ) diff --git a/tests/integration/test_check_table/test.py b/tests/integration/test_check_table/test.py index 021977fb6b6..ebf404e698b 100644 --- a/tests/integration/test_check_table/test.py +++ b/tests/integration/test_check_table/test.py @@ -95,15 +95,25 @@ def test_check_normal_table_corruption(started_cluster, merge_tree_settings): node1, "non_replicated_mt", "201902_1_1_0", database="default" ) - assert node1.query( - "CHECK TABLE non_replicated_mt", - settings={"check_query_single_value_result": 0, "max_threads": 1}, - ).strip().split("\t")[0:2] == ["201902_1_1_0", "0"] + assert ( + node1.query( + "CHECK TABLE non_replicated_mt", + settings={"check_query_single_value_result": 0, "max_threads": 1}, + ) + .strip() + .split("\t")[0:2] + == ["201902_1_1_0", "0"] + ) - assert node1.query( - "CHECK TABLE non_replicated_mt", - settings={"check_query_single_value_result": 0, "max_threads": 1}, - ).strip().split("\t")[0:2] == ["201902_1_1_0", "0"] + assert ( + node1.query( + "CHECK TABLE non_replicated_mt", + settings={"check_query_single_value_result": 0, "max_threads": 1}, + ) + .strip() + .split("\t")[0:2] + == ["201902_1_1_0", "0"] + ) node1.query( "INSERT INTO non_replicated_mt VALUES (toDate('2019-01-01'), 1, 10), (toDate('2019-01-01'), 2, 12)" @@ -123,10 +133,15 @@ def test_check_normal_table_corruption(started_cluster, merge_tree_settings): remove_checksums_on_disk(node1, 
"default", "non_replicated_mt", "201901_2_2_0") - assert node1.query( - "CHECK TABLE non_replicated_mt PARTITION 201901", - settings={"check_query_single_value_result": 0, "max_threads": 1}, - ).strip().split("\t")[0:2] == ["201901_2_2_0", "0"] + assert ( + node1.query( + "CHECK TABLE non_replicated_mt PARTITION 201901", + settings={"check_query_single_value_result": 0, "max_threads": 1}, + ) + .strip() + .split("\t")[0:2] + == ["201901_2_2_0", "0"] + ) @pytest.mark.parametrize("merge_tree_settings, zk_path_suffix", [("", "_0")]) @@ -194,12 +209,15 @@ def test_check_replicated_table_simple( == "201901_0_0_0\t1\t\n" ) - assert sorted( - node2.query( - "CHECK TABLE replicated_mt", - settings={"check_query_single_value_result": 0}, - ).split("\n") - ) == ["", "201901_0_0_0\t1\t", "201902_0_0_0\t1\t"] + assert ( + sorted( + node2.query( + "CHECK TABLE replicated_mt", + settings={"check_query_single_value_result": 0}, + ).split("\n") + ) + == ["", "201901_0_0_0\t1\t", "201902_0_0_0\t1\t"] + ) with pytest.raises(QueryRuntimeException) as exc: node2.query( @@ -273,10 +291,13 @@ def test_check_replicated_table_corruption( ) node1.query_with_retry("SYSTEM SYNC REPLICA replicated_mt_1") - assert node1.query( - "CHECK TABLE replicated_mt_1 PARTITION 201901", - settings={"check_query_single_value_result": 0, "max_threads": 1}, - ) == "{}\t1\t\n".format(part_name) + assert ( + node1.query( + "CHECK TABLE replicated_mt_1 PARTITION 201901", + settings={"check_query_single_value_result": 0, "max_threads": 1}, + ) + == "{}\t1\t\n".format(part_name) + ) assert node1.query("SELECT count() from replicated_mt_1") == "4\n" remove_part_from_disk(node2, "replicated_mt_1", part_name) @@ -288,10 +309,13 @@ def test_check_replicated_table_corruption( ) node1.query("SYSTEM SYNC REPLICA replicated_mt_1") - assert node1.query( - "CHECK TABLE replicated_mt_1 PARTITION 201901", - settings={"check_query_single_value_result": 0, "max_threads": 1}, - ) == "{}\t1\t\n".format(part_name) + assert ( + node1.query( + "CHECK TABLE replicated_mt_1 PARTITION 201901", + settings={"check_query_single_value_result": 0, "max_threads": 1}, + ) + == "{}\t1\t\n".format(part_name) + ) assert node1.query("SELECT count() from replicated_mt_1") == "4\n" diff --git a/tests/integration/test_cluster_discovery/test.py b/tests/integration/test_cluster_discovery/test.py index ad3deb5b142..a2e7e15b956 100644 --- a/tests/integration/test_cluster_discovery/test.py +++ b/tests/integration/test_cluster_discovery/test.py @@ -61,7 +61,7 @@ def check_on_cluster( print(f"Retry {retry}/{retries} unsuccessful, result: {node_results}") if retry != retries: - time.sleep(2**retry) + time.sleep(2 ** retry) else: msg = msg or f"Wrong '{what}' result" raise Exception( diff --git a/tests/integration/test_ldap_external_user_directory/test.py b/tests/integration/test_ldap_external_user_directory/test.py index 39753794d63..c9642c293ee 100644 --- a/tests/integration/test_ldap_external_user_directory/test.py +++ b/tests/integration/test_ldap_external_user_directory/test.py @@ -76,11 +76,14 @@ def test_role_mapping(ldap_cluster): "select currentUser()", user="johndoe", password="qwertz" ) == TSV([["johndoe"]]) - assert instance.query( - "select role_name from system.current_roles ORDER BY role_name", - user="johndoe", - password="qwertz", - ) == TSV([["role_1"], ["role_2"]]) + assert ( + instance.query( + "select role_name from system.current_roles ORDER BY role_name", + user="johndoe", + password="qwertz", + ) + == TSV([["role_1"], ["role_2"]]) + ) instance.query("CREATE 
ROLE role_3") add_ldap_group(ldap_cluster, group_cn="clickhouse-role_3", member_cn="johndoe") @@ -88,8 +91,11 @@ def test_role_mapping(ldap_cluster): # See https://github.com/ClickHouse/ClickHouse/issues/54318 add_ldap_group(ldap_cluster, group_cn="clickhouse-role_4", member_cn="johndoe") - assert instance.query( - "select role_name from system.current_roles ORDER BY role_name", - user="johndoe", - password="qwertz", - ) == TSV([["role_1"], ["role_2"], ["role_3"]]) + assert ( + instance.query( + "select role_name from system.current_roles ORDER BY role_name", + user="johndoe", + password="qwertz", + ) + == TSV([["role_1"], ["role_2"], ["role_3"]]) + ) diff --git a/tests/integration/test_mysql_protocol/test.py b/tests/integration/test_mysql_protocol/test.py index 7a69d07633c..61e76c0dc97 100644 --- a/tests/integration/test_mysql_protocol/test.py +++ b/tests/integration/test_mysql_protocol/test.py @@ -854,14 +854,14 @@ def test_types(started_cluster): result = cursor.fetchall()[0] expected = [ - ("Int8_column", -(2**7)), - ("UInt8_column", 2**8 - 1), - ("Int16_column", -(2**15)), - ("UInt16_column", 2**16 - 1), - ("Int32_column", -(2**31)), - ("UInt32_column", 2**32 - 1), - ("Int64_column", -(2**63)), - ("UInt64_column", 2**64 - 1), + ("Int8_column", -(2 ** 7)), + ("UInt8_column", 2 ** 8 - 1), + ("Int16_column", -(2 ** 15)), + ("UInt16_column", 2 ** 16 - 1), + ("Int32_column", -(2 ** 31)), + ("UInt32_column", 2 ** 32 - 1), + ("Int64_column", -(2 ** 63)), + ("UInt64_column", 2 ** 64 - 1), ("String_column", "тест"), ("FixedString_column", "тест"), ("Float32_column", 1.5), diff --git a/tests/integration/test_partition/test.py b/tests/integration/test_partition/test.py index 054418a8ba9..d39787f8924 100644 --- a/tests/integration/test_partition/test.py +++ b/tests/integration/test_partition/test.py @@ -561,9 +561,7 @@ def test_make_clone_in_detached(started_cluster): ["cp", "-r", path + "all_0_0_0", path + "detached/broken_all_0_0_0"] ) assert_eq_with_retry(instance, "select * from clone_in_detached", "\n") - assert [ - "broken_all_0_0_0", - ] == sorted( + assert ["broken_all_0_0_0",] == sorted( instance.exec_in_container(["ls", path + "detached/"]).strip().split("\n") ) diff --git a/tests/integration/test_replicated_database/test.py b/tests/integration/test_replicated_database/test.py index 1fc3fe37044..16425c9bd9e 100644 --- a/tests/integration/test_replicated_database/test.py +++ b/tests/integration/test_replicated_database/test.py @@ -506,12 +506,9 @@ def test_alters_from_different_replicas(started_cluster): dummy_node.stop_clickhouse(kill=True) settings = {"distributed_ddl_task_timeout": 5} - assert ( - "There are 1 unfinished hosts (0 of them are currently executing the task" - in competing_node.query_and_get_error( - "ALTER TABLE alters_from_different_replicas.concurrent_test ADD COLUMN Added0 UInt32;", - settings=settings, - ) + assert "There are 1 unfinished hosts (0 of them are currently executing the task" in competing_node.query_and_get_error( + "ALTER TABLE alters_from_different_replicas.concurrent_test ADD COLUMN Added0 UInt32;", + settings=settings, ) settings = { "distributed_ddl_task_timeout": 5, diff --git a/tests/integration/test_replicated_database_cluster_groups/test.py b/tests/integration/test_replicated_database_cluster_groups/test.py index 647626d8014..5a315707efb 100644 --- a/tests/integration/test_replicated_database_cluster_groups/test.py +++ b/tests/integration/test_replicated_database_cluster_groups/test.py @@ -95,12 +95,9 @@ def test_cluster_groups(started_cluster): 
# Exception main_node_2.stop_clickhouse() settings = {"distributed_ddl_task_timeout": 5} - assert ( - "There are 1 unfinished hosts (0 of them are currently executing the task)" - in main_node_1.query_and_get_error( - "CREATE TABLE cluster_groups.table_2 (d Date, k UInt64) ENGINE=ReplicatedMergeTree ORDER BY k PARTITION BY toYYYYMM(d);", - settings=settings, - ) + assert "There are 1 unfinished hosts (0 of them are currently executing the task)" in main_node_1.query_and_get_error( + "CREATE TABLE cluster_groups.table_2 (d Date, k UInt64) ENGINE=ReplicatedMergeTree ORDER BY k PARTITION BY toYYYYMM(d);", + settings=settings, ) # 3. After start both groups are synced diff --git a/tests/integration/test_storage_s3/s3_mocks/unstable_server.py b/tests/integration/test_storage_s3/s3_mocks/unstable_server.py index 5ef781bdc9e..3632fa15d8a 100644 --- a/tests/integration/test_storage_s3/s3_mocks/unstable_server.py +++ b/tests/integration/test_storage_s3/s3_mocks/unstable_server.py @@ -9,7 +9,7 @@ import time def gen_n_digit_number(n): assert 0 < n < 19 - return random.randint(10 ** (n - 1), 10**n - 1) + return random.randint(10 ** (n - 1), 10 ** n - 1) sum_in_4_column = 0 diff --git a/tests/integration/test_storage_s3/test.py b/tests/integration/test_storage_s3/test.py index 2549cb0d473..e941356261a 100644 --- a/tests/integration/test_storage_s3/test.py +++ b/tests/integration/test_storage_s3/test.py @@ -553,16 +553,13 @@ def test_multipart(started_cluster, maybe_auth, positive): assert csv_data == get_s3_file_content(started_cluster, bucket, filename) # select uploaded data from many threads - select_query = ( - "select sum(column1), sum(column2), sum(column3) " - "from s3('http://{host}:{port}/{bucket}/{filename}', {auth}'CSV', '{table_format}')".format( - host=started_cluster.minio_redirect_host, - port=started_cluster.minio_redirect_port, - bucket=bucket, - filename=filename, - auth=maybe_auth, - table_format=table_format, - ) + select_query = "select sum(column1), sum(column2), sum(column3) " "from s3('http://{host}:{port}/{bucket}/{filename}', {auth}'CSV', '{table_format}')".format( + host=started_cluster.minio_redirect_host, + port=started_cluster.minio_redirect_port, + bucket=bucket, + filename=filename, + auth=maybe_auth, + table_format=table_format, ) try: select_result = run_query( diff --git a/tests/integration/test_storage_url/test.py b/tests/integration/test_storage_url/test.py index 7ff7a871413..771df49cbac 100644 --- a/tests/integration/test_storage_url/test.py +++ b/tests/integration/test_storage_url/test.py @@ -79,15 +79,21 @@ def test_table_function_url_access_rights(): f"SELECT * FROM url('http://nginx:80/test_1', 'TSV')", user="u1" ) - assert node1.query( - f"DESCRIBE TABLE url('http://nginx:80/test_1', 'TSV', 'column1 UInt32, column2 UInt32, column3 UInt32')", - user="u1", - ) == TSV([["column1", "UInt32"], ["column2", "UInt32"], ["column3", "UInt32"]]) + assert ( + node1.query( + f"DESCRIBE TABLE url('http://nginx:80/test_1', 'TSV', 'column1 UInt32, column2 UInt32, column3 UInt32')", + user="u1", + ) + == TSV([["column1", "UInt32"], ["column2", "UInt32"], ["column3", "UInt32"]]) + ) - assert node1.query( - f"DESCRIBE TABLE url('http://nginx:80/not-exist', 'TSV', 'column1 UInt32, column2 UInt32, column3 UInt32')", - user="u1", - ) == TSV([["column1", "UInt32"], ["column2", "UInt32"], ["column3", "UInt32"]]) + assert ( + node1.query( + f"DESCRIBE TABLE url('http://nginx:80/not-exist', 'TSV', 'column1 UInt32, column2 UInt32, column3 UInt32')", + user="u1", + ) + == 
TSV([["column1", "UInt32"], ["column2", "UInt32"], ["column3", "UInt32"]]) + ) expected_error = "necessary to have the grant URL ON *.*" assert expected_error in node1.query_and_get_error( diff --git a/tests/integration/test_system_merges/test.py b/tests/integration/test_system_merges/test.py index 6dbe6c891f2..bacb0eb500d 100644 --- a/tests/integration/test_system_merges/test.py +++ b/tests/integration/test_system_merges/test.py @@ -204,36 +204,33 @@ def test_mutation_simple(started_cluster, replicated): sleep_time=0.1, ) - assert ( - split_tsv( - node_check.query( - """ + assert split_tsv( + node_check.query( + """ SELECT database, table, num_parts, source_part_names, source_part_paths, result_part_name, result_part_path, partition_id, is_mutation FROM system.merges WHERE table = '{name}' """.format( - name=table_name - ) + name=table_name ) ) - == [ - [ - db_name, - table_name, - "1", - "['{}']".format(part), - "['{clickhouse}/{table_path}/{}/']".format( - part, clickhouse=clickhouse_path, table_path=table_path - ), - result_part, - "{clickhouse}/{table_path}/{}/".format( - result_part, clickhouse=clickhouse_path, table_path=table_path - ), - "all", - "1", - ], - ] - ) + ) == [ + [ + db_name, + table_name, + "1", + "['{}']".format(part), + "['{clickhouse}/{table_path}/{}/']".format( + part, clickhouse=clickhouse_path, table_path=table_path + ), + result_part, + "{clickhouse}/{table_path}/{}/".format( + result_part, clickhouse=clickhouse_path, table_path=table_path + ), + "all", + "1", + ], + ] t.join() assert ( diff --git a/utils/grpc-client/pb2/clickhouse_grpc_pb2.py b/utils/grpc-client/pb2/clickhouse_grpc_pb2.py index 6218047af3c..9bf7817c7d3 100644 --- a/utils/grpc-client/pb2/clickhouse_grpc_pb2.py +++ b/utils/grpc-client/pb2/clickhouse_grpc_pb2.py @@ -8,16 +8,17 @@ from google.protobuf import descriptor_pool as _descriptor_pool from google.protobuf import message as _message from google.protobuf import reflection as _reflection from google.protobuf import symbol_database as _symbol_database + # @@protoc_insertion_point(imports) _sym_db = _symbol_database.Default() +DESCRIPTOR = _descriptor_pool.Default().AddSerializedFile( + b'\n\x15\x63lickhouse_grpc.proto\x12\x0f\x63lickhouse.grpc")\n\x0bNameAndType\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0c\n\x04type\x18\x02 \x01(\t"\xf5\x01\n\rExternalTable\x12\x0c\n\x04name\x18\x01 \x01(\t\x12-\n\x07\x63olumns\x18\x02 \x03(\x0b\x32\x1c.clickhouse.grpc.NameAndType\x12\x0c\n\x04\x64\x61ta\x18\x03 \x01(\x0c\x12\x0e\n\x06\x66ormat\x18\x04 \x01(\t\x12\x18\n\x10\x63ompression_type\x18\x06 \x01(\t\x12>\n\x08settings\x18\x05 \x03(\x0b\x32,.clickhouse.grpc.ExternalTable.SettingsEntry\x1a/\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01"\x85\x03\n\x1cObsoleteTransportCompression\x12U\n\talgorithm\x18\x01 \x01(\x0e\x32\x42.clickhouse.grpc.ObsoleteTransportCompression.CompressionAlgorithm\x12M\n\x05level\x18\x02 \x01(\x0e\x32>.clickhouse.grpc.ObsoleteTransportCompression.CompressionLevel"R\n\x14\x43ompressionAlgorithm\x12\x12\n\x0eNO_COMPRESSION\x10\x00\x12\x0b\n\x07\x44\x45\x46LATE\x10\x01\x12\x08\n\x04GZIP\x10\x02\x12\x0f\n\x0bSTREAM_GZIP\x10\x03"k\n\x10\x43ompressionLevel\x12\x14\n\x10\x43OMPRESSION_NONE\x10\x00\x12\x13\n\x0f\x43OMPRESSION_LOW\x10\x01\x12\x16\n\x12\x43OMPRESSION_MEDIUM\x10\x02\x12\x14\n\x10\x43OMPRESSION_HIGH\x10\x03"\x8e\x06\n\tQueryInfo\x12\r\n\x05query\x18\x01 \x01(\t\x12\x10\n\x08query_id\x18\x02 \x01(\t\x12:\n\x08settings\x18\x03 
\x03(\x0b\x32(.clickhouse.grpc.QueryInfo.SettingsEntry\x12\x10\n\x08\x64\x61tabase\x18\x04 \x01(\t\x12\x12\n\ninput_data\x18\x05 \x01(\x0c\x12\x1c\n\x14input_data_delimiter\x18\x06 \x01(\x0c\x12\x15\n\routput_format\x18\x07 \x01(\t\x12\x1b\n\x13send_output_columns\x18\x18 \x01(\x08\x12\x37\n\x0f\x65xternal_tables\x18\x08 \x03(\x0b\x32\x1e.clickhouse.grpc.ExternalTable\x12\x11\n\tuser_name\x18\t \x01(\t\x12\x10\n\x08password\x18\n \x01(\t\x12\r\n\x05quota\x18\x0b \x01(\t\x12\x12\n\nsession_id\x18\x0c \x01(\t\x12\x15\n\rsession_check\x18\r \x01(\x08\x12\x17\n\x0fsession_timeout\x18\x0e \x01(\r\x12\x0e\n\x06\x63\x61ncel\x18\x0f \x01(\x08\x12\x17\n\x0fnext_query_info\x18\x10 \x01(\x08\x12\x1e\n\x16input_compression_type\x18\x14 \x01(\t\x12\x1f\n\x17output_compression_type\x18\x15 \x01(\t\x12 \n\x18output_compression_level\x18\x13 \x01(\x05\x12"\n\x1atransport_compression_type\x18\x16 \x01(\t\x12#\n\x1btransport_compression_level\x18\x17 \x01(\x05\x12R\n\x1bobsolete_result_compression\x18\x11 \x01(\x0b\x32-.clickhouse.grpc.ObsoleteTransportCompression\x12!\n\x19obsolete_compression_type\x18\x12 \x01(\t\x1a/\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01"\xa1\x01\n\x08LogEntry\x12\x0c\n\x04time\x18\x01 \x01(\r\x12\x19\n\x11time_microseconds\x18\x02 \x01(\r\x12\x11\n\tthread_id\x18\x03 \x01(\x04\x12\x10\n\x08query_id\x18\x04 \x01(\t\x12)\n\x05level\x18\x05 \x01(\x0e\x32\x1a.clickhouse.grpc.LogsLevel\x12\x0e\n\x06source\x18\x06 \x01(\t\x12\x0c\n\x04text\x18\x07 \x01(\t"z\n\x08Progress\x12\x11\n\tread_rows\x18\x01 \x01(\x04\x12\x12\n\nread_bytes\x18\x02 \x01(\x04\x12\x1a\n\x12total_rows_to_read\x18\x03 \x01(\x04\x12\x14\n\x0cwritten_rows\x18\x04 \x01(\x04\x12\x15\n\rwritten_bytes\x18\x05 \x01(\x04"p\n\x05Stats\x12\x0c\n\x04rows\x18\x01 \x01(\x04\x12\x0e\n\x06\x62locks\x18\x02 \x01(\x04\x12\x17\n\x0f\x61llocated_bytes\x18\x03 \x01(\x04\x12\x15\n\rapplied_limit\x18\x04 \x01(\x08\x12\x19\n\x11rows_before_limit\x18\x05 \x01(\x04"R\n\tException\x12\x0c\n\x04\x63ode\x18\x01 \x01(\x05\x12\x0c\n\x04name\x18\x02 \x01(\t\x12\x14\n\x0c\x64isplay_text\x18\x03 \x01(\t\x12\x13\n\x0bstack_trace\x18\x04 \x01(\t"\xeb\x02\n\x06Result\x12\x10\n\x08query_id\x18\t \x01(\t\x12\x11\n\ttime_zone\x18\n \x01(\t\x12\x15\n\routput_format\x18\x0b \x01(\t\x12\x34\n\x0eoutput_columns\x18\x0c \x03(\x0b\x32\x1c.clickhouse.grpc.NameAndType\x12\x0e\n\x06output\x18\x01 \x01(\x0c\x12\x0e\n\x06totals\x18\x02 \x01(\x0c\x12\x10\n\x08\x65xtremes\x18\x03 \x01(\x0c\x12\'\n\x04logs\x18\x04 \x03(\x0b\x32\x19.clickhouse.grpc.LogEntry\x12+\n\x08progress\x18\x05 \x01(\x0b\x32\x19.clickhouse.grpc.Progress\x12%\n\x05stats\x18\x06 \x01(\x0b\x32\x16.clickhouse.grpc.Stats\x12-\n\texception\x18\x07 \x01(\x0b\x32\x1a.clickhouse.grpc.Exception\x12\x11\n\tcancelled\x18\x08 
\x01(\x08*\x9d\x01\n\tLogsLevel\x12\x0c\n\x08LOG_NONE\x10\x00\x12\r\n\tLOG_FATAL\x10\x01\x12\x10\n\x0cLOG_CRITICAL\x10\x02\x12\r\n\tLOG_ERROR\x10\x03\x12\x0f\n\x0bLOG_WARNING\x10\x04\x12\x0e\n\nLOG_NOTICE\x10\x05\x12\x13\n\x0fLOG_INFORMATION\x10\x06\x12\r\n\tLOG_DEBUG\x10\x07\x12\r\n\tLOG_TRACE\x10\x08\x32\xdb\x02\n\nClickHouse\x12\x45\n\x0c\x45xecuteQuery\x12\x1a.clickhouse.grpc.QueryInfo\x1a\x17.clickhouse.grpc.Result"\x00\x12V\n\x1b\x45xecuteQueryWithStreamInput\x12\x1a.clickhouse.grpc.QueryInfo\x1a\x17.clickhouse.grpc.Result"\x00(\x01\x12W\n\x1c\x45xecuteQueryWithStreamOutput\x12\x1a.clickhouse.grpc.QueryInfo\x1a\x17.clickhouse.grpc.Result"\x00\x30\x01\x12U\n\x18\x45xecuteQueryWithStreamIO\x12\x1a.clickhouse.grpc.QueryInfo\x1a\x17.clickhouse.grpc.Result"\x00(\x01\x30\x01\x62\x06proto3' +) - -DESCRIPTOR = _descriptor_pool.Default().AddSerializedFile(b'\n\x15\x63lickhouse_grpc.proto\x12\x0f\x63lickhouse.grpc\")\n\x0bNameAndType\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0c\n\x04type\x18\x02 \x01(\t\"\xf5\x01\n\rExternalTable\x12\x0c\n\x04name\x18\x01 \x01(\t\x12-\n\x07\x63olumns\x18\x02 \x03(\x0b\x32\x1c.clickhouse.grpc.NameAndType\x12\x0c\n\x04\x64\x61ta\x18\x03 \x01(\x0c\x12\x0e\n\x06\x66ormat\x18\x04 \x01(\t\x12\x18\n\x10\x63ompression_type\x18\x06 \x01(\t\x12>\n\x08settings\x18\x05 \x03(\x0b\x32,.clickhouse.grpc.ExternalTable.SettingsEntry\x1a/\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\"\x85\x03\n\x1cObsoleteTransportCompression\x12U\n\talgorithm\x18\x01 \x01(\x0e\x32\x42.clickhouse.grpc.ObsoleteTransportCompression.CompressionAlgorithm\x12M\n\x05level\x18\x02 \x01(\x0e\x32>.clickhouse.grpc.ObsoleteTransportCompression.CompressionLevel\"R\n\x14\x43ompressionAlgorithm\x12\x12\n\x0eNO_COMPRESSION\x10\x00\x12\x0b\n\x07\x44\x45\x46LATE\x10\x01\x12\x08\n\x04GZIP\x10\x02\x12\x0f\n\x0bSTREAM_GZIP\x10\x03\"k\n\x10\x43ompressionLevel\x12\x14\n\x10\x43OMPRESSION_NONE\x10\x00\x12\x13\n\x0f\x43OMPRESSION_LOW\x10\x01\x12\x16\n\x12\x43OMPRESSION_MEDIUM\x10\x02\x12\x14\n\x10\x43OMPRESSION_HIGH\x10\x03\"\x8e\x06\n\tQueryInfo\x12\r\n\x05query\x18\x01 \x01(\t\x12\x10\n\x08query_id\x18\x02 \x01(\t\x12:\n\x08settings\x18\x03 \x03(\x0b\x32(.clickhouse.grpc.QueryInfo.SettingsEntry\x12\x10\n\x08\x64\x61tabase\x18\x04 \x01(\t\x12\x12\n\ninput_data\x18\x05 \x01(\x0c\x12\x1c\n\x14input_data_delimiter\x18\x06 \x01(\x0c\x12\x15\n\routput_format\x18\x07 \x01(\t\x12\x1b\n\x13send_output_columns\x18\x18 \x01(\x08\x12\x37\n\x0f\x65xternal_tables\x18\x08 \x03(\x0b\x32\x1e.clickhouse.grpc.ExternalTable\x12\x11\n\tuser_name\x18\t \x01(\t\x12\x10\n\x08password\x18\n \x01(\t\x12\r\n\x05quota\x18\x0b \x01(\t\x12\x12\n\nsession_id\x18\x0c \x01(\t\x12\x15\n\rsession_check\x18\r \x01(\x08\x12\x17\n\x0fsession_timeout\x18\x0e \x01(\r\x12\x0e\n\x06\x63\x61ncel\x18\x0f \x01(\x08\x12\x17\n\x0fnext_query_info\x18\x10 \x01(\x08\x12\x1e\n\x16input_compression_type\x18\x14 \x01(\t\x12\x1f\n\x17output_compression_type\x18\x15 \x01(\t\x12 \n\x18output_compression_level\x18\x13 \x01(\x05\x12\"\n\x1atransport_compression_type\x18\x16 \x01(\t\x12#\n\x1btransport_compression_level\x18\x17 \x01(\x05\x12R\n\x1bobsolete_result_compression\x18\x11 \x01(\x0b\x32-.clickhouse.grpc.ObsoleteTransportCompression\x12!\n\x19obsolete_compression_type\x18\x12 \x01(\t\x1a/\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\"\xa1\x01\n\x08LogEntry\x12\x0c\n\x04time\x18\x01 \x01(\r\x12\x19\n\x11time_microseconds\x18\x02 \x01(\r\x12\x11\n\tthread_id\x18\x03 
\x01(\x04\x12\x10\n\x08query_id\x18\x04 \x01(\t\x12)\n\x05level\x18\x05 \x01(\x0e\x32\x1a.clickhouse.grpc.LogsLevel\x12\x0e\n\x06source\x18\x06 \x01(\t\x12\x0c\n\x04text\x18\x07 \x01(\t\"z\n\x08Progress\x12\x11\n\tread_rows\x18\x01 \x01(\x04\x12\x12\n\nread_bytes\x18\x02 \x01(\x04\x12\x1a\n\x12total_rows_to_read\x18\x03 \x01(\x04\x12\x14\n\x0cwritten_rows\x18\x04 \x01(\x04\x12\x15\n\rwritten_bytes\x18\x05 \x01(\x04\"p\n\x05Stats\x12\x0c\n\x04rows\x18\x01 \x01(\x04\x12\x0e\n\x06\x62locks\x18\x02 \x01(\x04\x12\x17\n\x0f\x61llocated_bytes\x18\x03 \x01(\x04\x12\x15\n\rapplied_limit\x18\x04 \x01(\x08\x12\x19\n\x11rows_before_limit\x18\x05 \x01(\x04\"R\n\tException\x12\x0c\n\x04\x63ode\x18\x01 \x01(\x05\x12\x0c\n\x04name\x18\x02 \x01(\t\x12\x14\n\x0c\x64isplay_text\x18\x03 \x01(\t\x12\x13\n\x0bstack_trace\x18\x04 \x01(\t\"\xeb\x02\n\x06Result\x12\x10\n\x08query_id\x18\t \x01(\t\x12\x11\n\ttime_zone\x18\n \x01(\t\x12\x15\n\routput_format\x18\x0b \x01(\t\x12\x34\n\x0eoutput_columns\x18\x0c \x03(\x0b\x32\x1c.clickhouse.grpc.NameAndType\x12\x0e\n\x06output\x18\x01 \x01(\x0c\x12\x0e\n\x06totals\x18\x02 \x01(\x0c\x12\x10\n\x08\x65xtremes\x18\x03 \x01(\x0c\x12\'\n\x04logs\x18\x04 \x03(\x0b\x32\x19.clickhouse.grpc.LogEntry\x12+\n\x08progress\x18\x05 \x01(\x0b\x32\x19.clickhouse.grpc.Progress\x12%\n\x05stats\x18\x06 \x01(\x0b\x32\x16.clickhouse.grpc.Stats\x12-\n\texception\x18\x07 \x01(\x0b\x32\x1a.clickhouse.grpc.Exception\x12\x11\n\tcancelled\x18\x08 \x01(\x08*\x9d\x01\n\tLogsLevel\x12\x0c\n\x08LOG_NONE\x10\x00\x12\r\n\tLOG_FATAL\x10\x01\x12\x10\n\x0cLOG_CRITICAL\x10\x02\x12\r\n\tLOG_ERROR\x10\x03\x12\x0f\n\x0bLOG_WARNING\x10\x04\x12\x0e\n\nLOG_NOTICE\x10\x05\x12\x13\n\x0fLOG_INFORMATION\x10\x06\x12\r\n\tLOG_DEBUG\x10\x07\x12\r\n\tLOG_TRACE\x10\x08\x32\xdb\x02\n\nClickHouse\x12\x45\n\x0c\x45xecuteQuery\x12\x1a.clickhouse.grpc.QueryInfo\x1a\x17.clickhouse.grpc.Result\"\x00\x12V\n\x1b\x45xecuteQueryWithStreamInput\x12\x1a.clickhouse.grpc.QueryInfo\x1a\x17.clickhouse.grpc.Result\"\x00(\x01\x12W\n\x1c\x45xecuteQueryWithStreamOutput\x12\x1a.clickhouse.grpc.QueryInfo\x1a\x17.clickhouse.grpc.Result\"\x00\x30\x01\x12U\n\x18\x45xecuteQueryWithStreamIO\x12\x1a.clickhouse.grpc.QueryInfo\x1a\x17.clickhouse.grpc.Result\"\x00(\x01\x30\x01\x62\x06proto3') - -_LOGSLEVEL = DESCRIPTOR.enum_types_by_name['LogsLevel'] +_LOGSLEVEL = DESCRIPTOR.enum_types_by_name["LogsLevel"] LogsLevel = enum_type_wrapper.EnumTypeWrapper(_LOGSLEVEL) LOG_NONE = 0 LOG_FATAL = 1 @@ -30,134 +31,180 @@ LOG_DEBUG = 7 LOG_TRACE = 8 -_NAMEANDTYPE = DESCRIPTOR.message_types_by_name['NameAndType'] -_EXTERNALTABLE = DESCRIPTOR.message_types_by_name['ExternalTable'] -_EXTERNALTABLE_SETTINGSENTRY = _EXTERNALTABLE.nested_types_by_name['SettingsEntry'] -_OBSOLETETRANSPORTCOMPRESSION = DESCRIPTOR.message_types_by_name['ObsoleteTransportCompression'] -_QUERYINFO = DESCRIPTOR.message_types_by_name['QueryInfo'] -_QUERYINFO_SETTINGSENTRY = _QUERYINFO.nested_types_by_name['SettingsEntry'] -_LOGENTRY = DESCRIPTOR.message_types_by_name['LogEntry'] -_PROGRESS = DESCRIPTOR.message_types_by_name['Progress'] -_STATS = DESCRIPTOR.message_types_by_name['Stats'] -_EXCEPTION = DESCRIPTOR.message_types_by_name['Exception'] -_RESULT = DESCRIPTOR.message_types_by_name['Result'] -_OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONALGORITHM = _OBSOLETETRANSPORTCOMPRESSION.enum_types_by_name['CompressionAlgorithm'] -_OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONLEVEL = _OBSOLETETRANSPORTCOMPRESSION.enum_types_by_name['CompressionLevel'] -NameAndType = 
_reflection.GeneratedProtocolMessageType('NameAndType', (_message.Message,), { - 'DESCRIPTOR' : _NAMEANDTYPE, - '__module__' : 'clickhouse_grpc_pb2' - # @@protoc_insertion_point(class_scope:clickhouse.grpc.NameAndType) - }) +_NAMEANDTYPE = DESCRIPTOR.message_types_by_name["NameAndType"] +_EXTERNALTABLE = DESCRIPTOR.message_types_by_name["ExternalTable"] +_EXTERNALTABLE_SETTINGSENTRY = _EXTERNALTABLE.nested_types_by_name["SettingsEntry"] +_OBSOLETETRANSPORTCOMPRESSION = DESCRIPTOR.message_types_by_name[ + "ObsoleteTransportCompression" +] +_QUERYINFO = DESCRIPTOR.message_types_by_name["QueryInfo"] +_QUERYINFO_SETTINGSENTRY = _QUERYINFO.nested_types_by_name["SettingsEntry"] +_LOGENTRY = DESCRIPTOR.message_types_by_name["LogEntry"] +_PROGRESS = DESCRIPTOR.message_types_by_name["Progress"] +_STATS = DESCRIPTOR.message_types_by_name["Stats"] +_EXCEPTION = DESCRIPTOR.message_types_by_name["Exception"] +_RESULT = DESCRIPTOR.message_types_by_name["Result"] +_OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONALGORITHM = ( + _OBSOLETETRANSPORTCOMPRESSION.enum_types_by_name["CompressionAlgorithm"] +) +_OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONLEVEL = ( + _OBSOLETETRANSPORTCOMPRESSION.enum_types_by_name["CompressionLevel"] +) +NameAndType = _reflection.GeneratedProtocolMessageType( + "NameAndType", + (_message.Message,), + { + "DESCRIPTOR": _NAMEANDTYPE, + "__module__": "clickhouse_grpc_pb2" + # @@protoc_insertion_point(class_scope:clickhouse.grpc.NameAndType) + }, +) _sym_db.RegisterMessage(NameAndType) -ExternalTable = _reflection.GeneratedProtocolMessageType('ExternalTable', (_message.Message,), { - - 'SettingsEntry' : _reflection.GeneratedProtocolMessageType('SettingsEntry', (_message.Message,), { - 'DESCRIPTOR' : _EXTERNALTABLE_SETTINGSENTRY, - '__module__' : 'clickhouse_grpc_pb2' - # @@protoc_insertion_point(class_scope:clickhouse.grpc.ExternalTable.SettingsEntry) - }) - , - 'DESCRIPTOR' : _EXTERNALTABLE, - '__module__' : 'clickhouse_grpc_pb2' - # @@protoc_insertion_point(class_scope:clickhouse.grpc.ExternalTable) - }) +ExternalTable = _reflection.GeneratedProtocolMessageType( + "ExternalTable", + (_message.Message,), + { + "SettingsEntry": _reflection.GeneratedProtocolMessageType( + "SettingsEntry", + (_message.Message,), + { + "DESCRIPTOR": _EXTERNALTABLE_SETTINGSENTRY, + "__module__": "clickhouse_grpc_pb2" + # @@protoc_insertion_point(class_scope:clickhouse.grpc.ExternalTable.SettingsEntry) + }, + ), + "DESCRIPTOR": _EXTERNALTABLE, + "__module__": "clickhouse_grpc_pb2" + # @@protoc_insertion_point(class_scope:clickhouse.grpc.ExternalTable) + }, +) _sym_db.RegisterMessage(ExternalTable) _sym_db.RegisterMessage(ExternalTable.SettingsEntry) -ObsoleteTransportCompression = _reflection.GeneratedProtocolMessageType('ObsoleteTransportCompression', (_message.Message,), { - 'DESCRIPTOR' : _OBSOLETETRANSPORTCOMPRESSION, - '__module__' : 'clickhouse_grpc_pb2' - # @@protoc_insertion_point(class_scope:clickhouse.grpc.ObsoleteTransportCompression) - }) +ObsoleteTransportCompression = _reflection.GeneratedProtocolMessageType( + "ObsoleteTransportCompression", + (_message.Message,), + { + "DESCRIPTOR": _OBSOLETETRANSPORTCOMPRESSION, + "__module__": "clickhouse_grpc_pb2" + # @@protoc_insertion_point(class_scope:clickhouse.grpc.ObsoleteTransportCompression) + }, +) _sym_db.RegisterMessage(ObsoleteTransportCompression) -QueryInfo = _reflection.GeneratedProtocolMessageType('QueryInfo', (_message.Message,), { - - 'SettingsEntry' : _reflection.GeneratedProtocolMessageType('SettingsEntry', (_message.Message,), { - 
'DESCRIPTOR' : _QUERYINFO_SETTINGSENTRY, - '__module__' : 'clickhouse_grpc_pb2' - # @@protoc_insertion_point(class_scope:clickhouse.grpc.QueryInfo.SettingsEntry) - }) - , - 'DESCRIPTOR' : _QUERYINFO, - '__module__' : 'clickhouse_grpc_pb2' - # @@protoc_insertion_point(class_scope:clickhouse.grpc.QueryInfo) - }) +QueryInfo = _reflection.GeneratedProtocolMessageType( + "QueryInfo", + (_message.Message,), + { + "SettingsEntry": _reflection.GeneratedProtocolMessageType( + "SettingsEntry", + (_message.Message,), + { + "DESCRIPTOR": _QUERYINFO_SETTINGSENTRY, + "__module__": "clickhouse_grpc_pb2" + # @@protoc_insertion_point(class_scope:clickhouse.grpc.QueryInfo.SettingsEntry) + }, + ), + "DESCRIPTOR": _QUERYINFO, + "__module__": "clickhouse_grpc_pb2" + # @@protoc_insertion_point(class_scope:clickhouse.grpc.QueryInfo) + }, +) _sym_db.RegisterMessage(QueryInfo) _sym_db.RegisterMessage(QueryInfo.SettingsEntry) -LogEntry = _reflection.GeneratedProtocolMessageType('LogEntry', (_message.Message,), { - 'DESCRIPTOR' : _LOGENTRY, - '__module__' : 'clickhouse_grpc_pb2' - # @@protoc_insertion_point(class_scope:clickhouse.grpc.LogEntry) - }) +LogEntry = _reflection.GeneratedProtocolMessageType( + "LogEntry", + (_message.Message,), + { + "DESCRIPTOR": _LOGENTRY, + "__module__": "clickhouse_grpc_pb2" + # @@protoc_insertion_point(class_scope:clickhouse.grpc.LogEntry) + }, +) _sym_db.RegisterMessage(LogEntry) -Progress = _reflection.GeneratedProtocolMessageType('Progress', (_message.Message,), { - 'DESCRIPTOR' : _PROGRESS, - '__module__' : 'clickhouse_grpc_pb2' - # @@protoc_insertion_point(class_scope:clickhouse.grpc.Progress) - }) +Progress = _reflection.GeneratedProtocolMessageType( + "Progress", + (_message.Message,), + { + "DESCRIPTOR": _PROGRESS, + "__module__": "clickhouse_grpc_pb2" + # @@protoc_insertion_point(class_scope:clickhouse.grpc.Progress) + }, +) _sym_db.RegisterMessage(Progress) -Stats = _reflection.GeneratedProtocolMessageType('Stats', (_message.Message,), { - 'DESCRIPTOR' : _STATS, - '__module__' : 'clickhouse_grpc_pb2' - # @@protoc_insertion_point(class_scope:clickhouse.grpc.Stats) - }) +Stats = _reflection.GeneratedProtocolMessageType( + "Stats", + (_message.Message,), + { + "DESCRIPTOR": _STATS, + "__module__": "clickhouse_grpc_pb2" + # @@protoc_insertion_point(class_scope:clickhouse.grpc.Stats) + }, +) _sym_db.RegisterMessage(Stats) -Exception = _reflection.GeneratedProtocolMessageType('Exception', (_message.Message,), { - 'DESCRIPTOR' : _EXCEPTION, - '__module__' : 'clickhouse_grpc_pb2' - # @@protoc_insertion_point(class_scope:clickhouse.grpc.Exception) - }) +Exception = _reflection.GeneratedProtocolMessageType( + "Exception", + (_message.Message,), + { + "DESCRIPTOR": _EXCEPTION, + "__module__": "clickhouse_grpc_pb2" + # @@protoc_insertion_point(class_scope:clickhouse.grpc.Exception) + }, +) _sym_db.RegisterMessage(Exception) -Result = _reflection.GeneratedProtocolMessageType('Result', (_message.Message,), { - 'DESCRIPTOR' : _RESULT, - '__module__' : 'clickhouse_grpc_pb2' - # @@protoc_insertion_point(class_scope:clickhouse.grpc.Result) - }) +Result = _reflection.GeneratedProtocolMessageType( + "Result", + (_message.Message,), + { + "DESCRIPTOR": _RESULT, + "__module__": "clickhouse_grpc_pb2" + # @@protoc_insertion_point(class_scope:clickhouse.grpc.Result) + }, +) _sym_db.RegisterMessage(Result) -_CLICKHOUSE = DESCRIPTOR.services_by_name['ClickHouse'] +_CLICKHOUSE = DESCRIPTOR.services_by_name["ClickHouse"] if _descriptor._USE_C_DESCRIPTORS == False: - DESCRIPTOR._options = None - 
_EXTERNALTABLE_SETTINGSENTRY._options = None - _EXTERNALTABLE_SETTINGSENTRY._serialized_options = b'8\001' - _QUERYINFO_SETTINGSENTRY._options = None - _QUERYINFO_SETTINGSENTRY._serialized_options = b'8\001' - _LOGSLEVEL._serialized_start=2363 - _LOGSLEVEL._serialized_end=2520 - _NAMEANDTYPE._serialized_start=42 - _NAMEANDTYPE._serialized_end=83 - _EXTERNALTABLE._serialized_start=86 - _EXTERNALTABLE._serialized_end=331 - _EXTERNALTABLE_SETTINGSENTRY._serialized_start=284 - _EXTERNALTABLE_SETTINGSENTRY._serialized_end=331 - _OBSOLETETRANSPORTCOMPRESSION._serialized_start=334 - _OBSOLETETRANSPORTCOMPRESSION._serialized_end=723 - _OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONALGORITHM._serialized_start=532 - _OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONALGORITHM._serialized_end=614 - _OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONLEVEL._serialized_start=616 - _OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONLEVEL._serialized_end=723 - _QUERYINFO._serialized_start=726 - _QUERYINFO._serialized_end=1508 - _QUERYINFO_SETTINGSENTRY._serialized_start=284 - _QUERYINFO_SETTINGSENTRY._serialized_end=331 - _LOGENTRY._serialized_start=1511 - _LOGENTRY._serialized_end=1672 - _PROGRESS._serialized_start=1674 - _PROGRESS._serialized_end=1796 - _STATS._serialized_start=1798 - _STATS._serialized_end=1910 - _EXCEPTION._serialized_start=1912 - _EXCEPTION._serialized_end=1994 - _RESULT._serialized_start=1997 - _RESULT._serialized_end=2360 - _CLICKHOUSE._serialized_start=2523 - _CLICKHOUSE._serialized_end=2870 + DESCRIPTOR._options = None + _EXTERNALTABLE_SETTINGSENTRY._options = None + _EXTERNALTABLE_SETTINGSENTRY._serialized_options = b"8\001" + _QUERYINFO_SETTINGSENTRY._options = None + _QUERYINFO_SETTINGSENTRY._serialized_options = b"8\001" + _LOGSLEVEL._serialized_start = 2363 + _LOGSLEVEL._serialized_end = 2520 + _NAMEANDTYPE._serialized_start = 42 + _NAMEANDTYPE._serialized_end = 83 + _EXTERNALTABLE._serialized_start = 86 + _EXTERNALTABLE._serialized_end = 331 + _EXTERNALTABLE_SETTINGSENTRY._serialized_start = 284 + _EXTERNALTABLE_SETTINGSENTRY._serialized_end = 331 + _OBSOLETETRANSPORTCOMPRESSION._serialized_start = 334 + _OBSOLETETRANSPORTCOMPRESSION._serialized_end = 723 + _OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONALGORITHM._serialized_start = 532 + _OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONALGORITHM._serialized_end = 614 + _OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONLEVEL._serialized_start = 616 + _OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONLEVEL._serialized_end = 723 + _QUERYINFO._serialized_start = 726 + _QUERYINFO._serialized_end = 1508 + _QUERYINFO_SETTINGSENTRY._serialized_start = 284 + _QUERYINFO_SETTINGSENTRY._serialized_end = 331 + _LOGENTRY._serialized_start = 1511 + _LOGENTRY._serialized_end = 1672 + _PROGRESS._serialized_start = 1674 + _PROGRESS._serialized_end = 1796 + _STATS._serialized_start = 1798 + _STATS._serialized_end = 1910 + _EXCEPTION._serialized_start = 1912 + _EXCEPTION._serialized_end = 1994 + _RESULT._serialized_start = 1997 + _RESULT._serialized_end = 2360 + _CLICKHOUSE._serialized_start = 2523 + _CLICKHOUSE._serialized_end = 2870 # @@protoc_insertion_point(module_scope) diff --git a/utils/grpc-client/pb2/clickhouse_grpc_pb2_grpc.py b/utils/grpc-client/pb2/clickhouse_grpc_pb2_grpc.py index 1c71218bbe5..25643a243b3 100644 --- a/utils/grpc-client/pb2/clickhouse_grpc_pb2_grpc.py +++ b/utils/grpc-client/pb2/clickhouse_grpc_pb2_grpc.py @@ -15,25 +15,25 @@ class ClickHouseStub(object): channel: A grpc.Channel. 
""" self.ExecuteQuery = channel.unary_unary( - '/clickhouse.grpc.ClickHouse/ExecuteQuery', - request_serializer=clickhouse__grpc__pb2.QueryInfo.SerializeToString, - response_deserializer=clickhouse__grpc__pb2.Result.FromString, - ) + "/clickhouse.grpc.ClickHouse/ExecuteQuery", + request_serializer=clickhouse__grpc__pb2.QueryInfo.SerializeToString, + response_deserializer=clickhouse__grpc__pb2.Result.FromString, + ) self.ExecuteQueryWithStreamInput = channel.stream_unary( - '/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamInput', - request_serializer=clickhouse__grpc__pb2.QueryInfo.SerializeToString, - response_deserializer=clickhouse__grpc__pb2.Result.FromString, - ) + "/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamInput", + request_serializer=clickhouse__grpc__pb2.QueryInfo.SerializeToString, + response_deserializer=clickhouse__grpc__pb2.Result.FromString, + ) self.ExecuteQueryWithStreamOutput = channel.unary_stream( - '/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamOutput', - request_serializer=clickhouse__grpc__pb2.QueryInfo.SerializeToString, - response_deserializer=clickhouse__grpc__pb2.Result.FromString, - ) + "/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamOutput", + request_serializer=clickhouse__grpc__pb2.QueryInfo.SerializeToString, + response_deserializer=clickhouse__grpc__pb2.Result.FromString, + ) self.ExecuteQueryWithStreamIO = channel.stream_stream( - '/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamIO', - request_serializer=clickhouse__grpc__pb2.QueryInfo.SerializeToString, - response_deserializer=clickhouse__grpc__pb2.Result.FromString, - ) + "/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamIO", + request_serializer=clickhouse__grpc__pb2.QueryInfo.SerializeToString, + response_deserializer=clickhouse__grpc__pb2.Result.FromString, + ) class ClickHouseServicer(object): @@ -42,124 +42,173 @@ class ClickHouseServicer(object): def ExecuteQuery(self, request, context): """Missing associated documentation comment in .proto file.""" context.set_code(grpc.StatusCode.UNIMPLEMENTED) - context.set_details('Method not implemented!') - raise NotImplementedError('Method not implemented!') + context.set_details("Method not implemented!") + raise NotImplementedError("Method not implemented!") def ExecuteQueryWithStreamInput(self, request_iterator, context): """Missing associated documentation comment in .proto file.""" context.set_code(grpc.StatusCode.UNIMPLEMENTED) - context.set_details('Method not implemented!') - raise NotImplementedError('Method not implemented!') + context.set_details("Method not implemented!") + raise NotImplementedError("Method not implemented!") def ExecuteQueryWithStreamOutput(self, request, context): """Missing associated documentation comment in .proto file.""" context.set_code(grpc.StatusCode.UNIMPLEMENTED) - context.set_details('Method not implemented!') - raise NotImplementedError('Method not implemented!') + context.set_details("Method not implemented!") + raise NotImplementedError("Method not implemented!") def ExecuteQueryWithStreamIO(self, request_iterator, context): """Missing associated documentation comment in .proto file.""" context.set_code(grpc.StatusCode.UNIMPLEMENTED) - context.set_details('Method not implemented!') - raise NotImplementedError('Method not implemented!') + context.set_details("Method not implemented!") + raise NotImplementedError("Method not implemented!") def add_ClickHouseServicer_to_server(servicer, server): rpc_method_handlers = { - 'ExecuteQuery': grpc.unary_unary_rpc_method_handler( - servicer.ExecuteQuery, - 
request_deserializer=clickhouse__grpc__pb2.QueryInfo.FromString, - response_serializer=clickhouse__grpc__pb2.Result.SerializeToString, - ), - 'ExecuteQueryWithStreamInput': grpc.stream_unary_rpc_method_handler( - servicer.ExecuteQueryWithStreamInput, - request_deserializer=clickhouse__grpc__pb2.QueryInfo.FromString, - response_serializer=clickhouse__grpc__pb2.Result.SerializeToString, - ), - 'ExecuteQueryWithStreamOutput': grpc.unary_stream_rpc_method_handler( - servicer.ExecuteQueryWithStreamOutput, - request_deserializer=clickhouse__grpc__pb2.QueryInfo.FromString, - response_serializer=clickhouse__grpc__pb2.Result.SerializeToString, - ), - 'ExecuteQueryWithStreamIO': grpc.stream_stream_rpc_method_handler( - servicer.ExecuteQueryWithStreamIO, - request_deserializer=clickhouse__grpc__pb2.QueryInfo.FromString, - response_serializer=clickhouse__grpc__pb2.Result.SerializeToString, - ), + "ExecuteQuery": grpc.unary_unary_rpc_method_handler( + servicer.ExecuteQuery, + request_deserializer=clickhouse__grpc__pb2.QueryInfo.FromString, + response_serializer=clickhouse__grpc__pb2.Result.SerializeToString, + ), + "ExecuteQueryWithStreamInput": grpc.stream_unary_rpc_method_handler( + servicer.ExecuteQueryWithStreamInput, + request_deserializer=clickhouse__grpc__pb2.QueryInfo.FromString, + response_serializer=clickhouse__grpc__pb2.Result.SerializeToString, + ), + "ExecuteQueryWithStreamOutput": grpc.unary_stream_rpc_method_handler( + servicer.ExecuteQueryWithStreamOutput, + request_deserializer=clickhouse__grpc__pb2.QueryInfo.FromString, + response_serializer=clickhouse__grpc__pb2.Result.SerializeToString, + ), + "ExecuteQueryWithStreamIO": grpc.stream_stream_rpc_method_handler( + servicer.ExecuteQueryWithStreamIO, + request_deserializer=clickhouse__grpc__pb2.QueryInfo.FromString, + response_serializer=clickhouse__grpc__pb2.Result.SerializeToString, + ), } generic_handler = grpc.method_handlers_generic_handler( - 'clickhouse.grpc.ClickHouse', rpc_method_handlers) + "clickhouse.grpc.ClickHouse", rpc_method_handlers + ) server.add_generic_rpc_handlers((generic_handler,)) - # This class is part of an EXPERIMENTAL API. +# This class is part of an EXPERIMENTAL API. 
class ClickHouse(object): """Missing associated documentation comment in .proto file.""" @staticmethod - def ExecuteQuery(request, + def ExecuteQuery( + request, + target, + options=(), + channel_credentials=None, + call_credentials=None, + insecure=False, + compression=None, + wait_for_ready=None, + timeout=None, + metadata=None, + ): + return grpc.experimental.unary_unary( + request, target, - options=(), - channel_credentials=None, - call_credentials=None, - insecure=False, - compression=None, - wait_for_ready=None, - timeout=None, - metadata=None): - return grpc.experimental.unary_unary(request, target, '/clickhouse.grpc.ClickHouse/ExecuteQuery', + "/clickhouse.grpc.ClickHouse/ExecuteQuery", clickhouse__grpc__pb2.QueryInfo.SerializeToString, clickhouse__grpc__pb2.Result.FromString, - options, channel_credentials, - insecure, call_credentials, compression, wait_for_ready, timeout, metadata) + options, + channel_credentials, + insecure, + call_credentials, + compression, + wait_for_ready, + timeout, + metadata, + ) @staticmethod - def ExecuteQueryWithStreamInput(request_iterator, + def ExecuteQueryWithStreamInput( + request_iterator, + target, + options=(), + channel_credentials=None, + call_credentials=None, + insecure=False, + compression=None, + wait_for_ready=None, + timeout=None, + metadata=None, + ): + return grpc.experimental.stream_unary( + request_iterator, target, - options=(), - channel_credentials=None, - call_credentials=None, - insecure=False, - compression=None, - wait_for_ready=None, - timeout=None, - metadata=None): - return grpc.experimental.stream_unary(request_iterator, target, '/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamInput', + "/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamInput", clickhouse__grpc__pb2.QueryInfo.SerializeToString, clickhouse__grpc__pb2.Result.FromString, - options, channel_credentials, - insecure, call_credentials, compression, wait_for_ready, timeout, metadata) + options, + channel_credentials, + insecure, + call_credentials, + compression, + wait_for_ready, + timeout, + metadata, + ) @staticmethod - def ExecuteQueryWithStreamOutput(request, + def ExecuteQueryWithStreamOutput( + request, + target, + options=(), + channel_credentials=None, + call_credentials=None, + insecure=False, + compression=None, + wait_for_ready=None, + timeout=None, + metadata=None, + ): + return grpc.experimental.unary_stream( + request, target, - options=(), - channel_credentials=None, - call_credentials=None, - insecure=False, - compression=None, - wait_for_ready=None, - timeout=None, - metadata=None): - return grpc.experimental.unary_stream(request, target, '/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamOutput', + "/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamOutput", clickhouse__grpc__pb2.QueryInfo.SerializeToString, clickhouse__grpc__pb2.Result.FromString, - options, channel_credentials, - insecure, call_credentials, compression, wait_for_ready, timeout, metadata) + options, + channel_credentials, + insecure, + call_credentials, + compression, + wait_for_ready, + timeout, + metadata, + ) @staticmethod - def ExecuteQueryWithStreamIO(request_iterator, + def ExecuteQueryWithStreamIO( + request_iterator, + target, + options=(), + channel_credentials=None, + call_credentials=None, + insecure=False, + compression=None, + wait_for_ready=None, + timeout=None, + metadata=None, + ): + return grpc.experimental.stream_stream( + request_iterator, target, - options=(), - channel_credentials=None, - call_credentials=None, - insecure=False, - compression=None, - 
wait_for_ready=None, - timeout=None, - metadata=None): - return grpc.experimental.stream_stream(request_iterator, target, '/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamIO', + "/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamIO", clickhouse__grpc__pb2.QueryInfo.SerializeToString, clickhouse__grpc__pb2.Result.FromString, - options, channel_credentials, - insecure, call_credentials, compression, wait_for_ready, timeout, metadata) + options, + channel_credentials, + insecure, + call_credentials, + compression, + wait_for_ready, + timeout, + metadata, + ) From e42d10fa9ccf4296732941e9f1b333d692e83384 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 06:25:20 +0100 Subject: [PATCH 0141/1081] Revert "Obey Python's quirky formatter" This reverts commit 678a32cedee768b6c1a6748e96a0d103e853d8bc. --- tests/integration/ci-runner.py | 13 +- .../test_async_insert_memory/test.py | 2 +- tests/integration/test_check_table/test.py | 76 ++--- .../test_cluster_discovery/test.py | 2 +- .../test_ldap_external_user_directory/test.py | 26 +- tests/integration/test_mysql_protocol/test.py | 16 +- tests/integration/test_partition/test.py | 4 +- .../test_replicated_database/test.py | 9 +- .../test.py | 9 +- .../s3_mocks/unstable_server.py | 2 +- tests/integration/test_storage_s3/test.py | 17 +- tests/integration/test_storage_url/test.py | 22 +- tests/integration/test_system_merges/test.py | 45 +-- utils/grpc-client/pb2/clickhouse_grpc_pb2.py | 271 ++++++++---------- .../pb2/clickhouse_grpc_pb2_grpc.py | 237 ++++++--------- 15 files changed, 318 insertions(+), 433 deletions(-) diff --git a/tests/integration/ci-runner.py b/tests/integration/ci-runner.py index d54ed2bb767..7c922e339fe 100755 --- a/tests/integration/ci-runner.py +++ b/tests/integration/ci-runner.py @@ -305,11 +305,14 @@ class ClickhouseIntegrationTestsRunner: def _pre_pull_images(self, repo_path): image_cmd = self._get_runner_image_cmd(repo_path) - cmd = "cd {repo_path}/tests/integration && " "timeout --signal=KILL 1h ./runner {runner_opts} {image_cmd} --pre-pull --command '{command}' ".format( - repo_path=repo_path, - runner_opts=self._get_runner_opts(), - image_cmd=image_cmd, - command=r""" echo Pre Pull finished """, + cmd = ( + "cd {repo_path}/tests/integration && " + "timeout --signal=KILL 1h ./runner {runner_opts} {image_cmd} --pre-pull --command '{command}' ".format( + repo_path=repo_path, + runner_opts=self._get_runner_opts(), + image_cmd=image_cmd, + command=r""" echo Pre Pull finished """, + ) ) for i in range(5): diff --git a/tests/integration/test_async_insert_memory/test.py b/tests/integration/test_async_insert_memory/test.py index f897007f7bb..5d2e5503680 100644 --- a/tests/integration/test_async_insert_memory/test.py +++ b/tests/integration/test_async_insert_memory/test.py @@ -43,7 +43,7 @@ def test_memory_usage(): response = node.get_query_request( "SELECT groupArray(number) FROM numbers(1000000) SETTINGS max_memory_usage_for_user={}".format( - 30 * (2 ** 23) + 30 * (2**23) ), user="A", ) diff --git a/tests/integration/test_check_table/test.py b/tests/integration/test_check_table/test.py index ebf404e698b..021977fb6b6 100644 --- a/tests/integration/test_check_table/test.py +++ b/tests/integration/test_check_table/test.py @@ -95,25 +95,15 @@ def test_check_normal_table_corruption(started_cluster, merge_tree_settings): node1, "non_replicated_mt", "201902_1_1_0", database="default" ) - assert ( - node1.query( - "CHECK TABLE non_replicated_mt", - settings={"check_query_single_value_result": 0, "max_threads": 1}, - 
) - .strip() - .split("\t")[0:2] - == ["201902_1_1_0", "0"] - ) + assert node1.query( + "CHECK TABLE non_replicated_mt", + settings={"check_query_single_value_result": 0, "max_threads": 1}, + ).strip().split("\t")[0:2] == ["201902_1_1_0", "0"] - assert ( - node1.query( - "CHECK TABLE non_replicated_mt", - settings={"check_query_single_value_result": 0, "max_threads": 1}, - ) - .strip() - .split("\t")[0:2] - == ["201902_1_1_0", "0"] - ) + assert node1.query( + "CHECK TABLE non_replicated_mt", + settings={"check_query_single_value_result": 0, "max_threads": 1}, + ).strip().split("\t")[0:2] == ["201902_1_1_0", "0"] node1.query( "INSERT INTO non_replicated_mt VALUES (toDate('2019-01-01'), 1, 10), (toDate('2019-01-01'), 2, 12)" @@ -133,15 +123,10 @@ def test_check_normal_table_corruption(started_cluster, merge_tree_settings): remove_checksums_on_disk(node1, "default", "non_replicated_mt", "201901_2_2_0") - assert ( - node1.query( - "CHECK TABLE non_replicated_mt PARTITION 201901", - settings={"check_query_single_value_result": 0, "max_threads": 1}, - ) - .strip() - .split("\t")[0:2] - == ["201901_2_2_0", "0"] - ) + assert node1.query( + "CHECK TABLE non_replicated_mt PARTITION 201901", + settings={"check_query_single_value_result": 0, "max_threads": 1}, + ).strip().split("\t")[0:2] == ["201901_2_2_0", "0"] @pytest.mark.parametrize("merge_tree_settings, zk_path_suffix", [("", "_0")]) @@ -209,15 +194,12 @@ def test_check_replicated_table_simple( == "201901_0_0_0\t1\t\n" ) - assert ( - sorted( - node2.query( - "CHECK TABLE replicated_mt", - settings={"check_query_single_value_result": 0}, - ).split("\n") - ) - == ["", "201901_0_0_0\t1\t", "201902_0_0_0\t1\t"] - ) + assert sorted( + node2.query( + "CHECK TABLE replicated_mt", + settings={"check_query_single_value_result": 0}, + ).split("\n") + ) == ["", "201901_0_0_0\t1\t", "201902_0_0_0\t1\t"] with pytest.raises(QueryRuntimeException) as exc: node2.query( @@ -291,13 +273,10 @@ def test_check_replicated_table_corruption( ) node1.query_with_retry("SYSTEM SYNC REPLICA replicated_mt_1") - assert ( - node1.query( - "CHECK TABLE replicated_mt_1 PARTITION 201901", - settings={"check_query_single_value_result": 0, "max_threads": 1}, - ) - == "{}\t1\t\n".format(part_name) - ) + assert node1.query( + "CHECK TABLE replicated_mt_1 PARTITION 201901", + settings={"check_query_single_value_result": 0, "max_threads": 1}, + ) == "{}\t1\t\n".format(part_name) assert node1.query("SELECT count() from replicated_mt_1") == "4\n" remove_part_from_disk(node2, "replicated_mt_1", part_name) @@ -309,13 +288,10 @@ def test_check_replicated_table_corruption( ) node1.query("SYSTEM SYNC REPLICA replicated_mt_1") - assert ( - node1.query( - "CHECK TABLE replicated_mt_1 PARTITION 201901", - settings={"check_query_single_value_result": 0, "max_threads": 1}, - ) - == "{}\t1\t\n".format(part_name) - ) + assert node1.query( + "CHECK TABLE replicated_mt_1 PARTITION 201901", + settings={"check_query_single_value_result": 0, "max_threads": 1}, + ) == "{}\t1\t\n".format(part_name) assert node1.query("SELECT count() from replicated_mt_1") == "4\n" diff --git a/tests/integration/test_cluster_discovery/test.py b/tests/integration/test_cluster_discovery/test.py index a2e7e15b956..ad3deb5b142 100644 --- a/tests/integration/test_cluster_discovery/test.py +++ b/tests/integration/test_cluster_discovery/test.py @@ -61,7 +61,7 @@ def check_on_cluster( print(f"Retry {retry}/{retries} unsuccessful, result: {node_results}") if retry != retries: - time.sleep(2 ** retry) + time.sleep(2**retry) else: 
msg = msg or f"Wrong '{what}' result" raise Exception( diff --git a/tests/integration/test_ldap_external_user_directory/test.py b/tests/integration/test_ldap_external_user_directory/test.py index c9642c293ee..39753794d63 100644 --- a/tests/integration/test_ldap_external_user_directory/test.py +++ b/tests/integration/test_ldap_external_user_directory/test.py @@ -76,14 +76,11 @@ def test_role_mapping(ldap_cluster): "select currentUser()", user="johndoe", password="qwertz" ) == TSV([["johndoe"]]) - assert ( - instance.query( - "select role_name from system.current_roles ORDER BY role_name", - user="johndoe", - password="qwertz", - ) - == TSV([["role_1"], ["role_2"]]) - ) + assert instance.query( + "select role_name from system.current_roles ORDER BY role_name", + user="johndoe", + password="qwertz", + ) == TSV([["role_1"], ["role_2"]]) instance.query("CREATE ROLE role_3") add_ldap_group(ldap_cluster, group_cn="clickhouse-role_3", member_cn="johndoe") @@ -91,11 +88,8 @@ def test_role_mapping(ldap_cluster): # See https://github.com/ClickHouse/ClickHouse/issues/54318 add_ldap_group(ldap_cluster, group_cn="clickhouse-role_4", member_cn="johndoe") - assert ( - instance.query( - "select role_name from system.current_roles ORDER BY role_name", - user="johndoe", - password="qwertz", - ) - == TSV([["role_1"], ["role_2"], ["role_3"]]) - ) + assert instance.query( + "select role_name from system.current_roles ORDER BY role_name", + user="johndoe", + password="qwertz", + ) == TSV([["role_1"], ["role_2"], ["role_3"]]) diff --git a/tests/integration/test_mysql_protocol/test.py b/tests/integration/test_mysql_protocol/test.py index 61e76c0dc97..7a69d07633c 100644 --- a/tests/integration/test_mysql_protocol/test.py +++ b/tests/integration/test_mysql_protocol/test.py @@ -854,14 +854,14 @@ def test_types(started_cluster): result = cursor.fetchall()[0] expected = [ - ("Int8_column", -(2 ** 7)), - ("UInt8_column", 2 ** 8 - 1), - ("Int16_column", -(2 ** 15)), - ("UInt16_column", 2 ** 16 - 1), - ("Int32_column", -(2 ** 31)), - ("UInt32_column", 2 ** 32 - 1), - ("Int64_column", -(2 ** 63)), - ("UInt64_column", 2 ** 64 - 1), + ("Int8_column", -(2**7)), + ("UInt8_column", 2**8 - 1), + ("Int16_column", -(2**15)), + ("UInt16_column", 2**16 - 1), + ("Int32_column", -(2**31)), + ("UInt32_column", 2**32 - 1), + ("Int64_column", -(2**63)), + ("UInt64_column", 2**64 - 1), ("String_column", "тест"), ("FixedString_column", "тест"), ("Float32_column", 1.5), diff --git a/tests/integration/test_partition/test.py b/tests/integration/test_partition/test.py index d39787f8924..054418a8ba9 100644 --- a/tests/integration/test_partition/test.py +++ b/tests/integration/test_partition/test.py @@ -561,7 +561,9 @@ def test_make_clone_in_detached(started_cluster): ["cp", "-r", path + "all_0_0_0", path + "detached/broken_all_0_0_0"] ) assert_eq_with_retry(instance, "select * from clone_in_detached", "\n") - assert ["broken_all_0_0_0",] == sorted( + assert [ + "broken_all_0_0_0", + ] == sorted( instance.exec_in_container(["ls", path + "detached/"]).strip().split("\n") ) diff --git a/tests/integration/test_replicated_database/test.py b/tests/integration/test_replicated_database/test.py index 16425c9bd9e..1fc3fe37044 100644 --- a/tests/integration/test_replicated_database/test.py +++ b/tests/integration/test_replicated_database/test.py @@ -506,9 +506,12 @@ def test_alters_from_different_replicas(started_cluster): dummy_node.stop_clickhouse(kill=True) settings = {"distributed_ddl_task_timeout": 5} - assert "There are 1 unfinished hosts (0 of them 
are currently executing the task" in competing_node.query_and_get_error( - "ALTER TABLE alters_from_different_replicas.concurrent_test ADD COLUMN Added0 UInt32;", - settings=settings, + assert ( + "There are 1 unfinished hosts (0 of them are currently executing the task" + in competing_node.query_and_get_error( + "ALTER TABLE alters_from_different_replicas.concurrent_test ADD COLUMN Added0 UInt32;", + settings=settings, + ) ) settings = { "distributed_ddl_task_timeout": 5, diff --git a/tests/integration/test_replicated_database_cluster_groups/test.py b/tests/integration/test_replicated_database_cluster_groups/test.py index 5a315707efb..647626d8014 100644 --- a/tests/integration/test_replicated_database_cluster_groups/test.py +++ b/tests/integration/test_replicated_database_cluster_groups/test.py @@ -95,9 +95,12 @@ def test_cluster_groups(started_cluster): # Exception main_node_2.stop_clickhouse() settings = {"distributed_ddl_task_timeout": 5} - assert "There are 1 unfinished hosts (0 of them are currently executing the task)" in main_node_1.query_and_get_error( - "CREATE TABLE cluster_groups.table_2 (d Date, k UInt64) ENGINE=ReplicatedMergeTree ORDER BY k PARTITION BY toYYYYMM(d);", - settings=settings, + assert ( + "There are 1 unfinished hosts (0 of them are currently executing the task)" + in main_node_1.query_and_get_error( + "CREATE TABLE cluster_groups.table_2 (d Date, k UInt64) ENGINE=ReplicatedMergeTree ORDER BY k PARTITION BY toYYYYMM(d);", + settings=settings, + ) ) # 3. After start both groups are synced diff --git a/tests/integration/test_storage_s3/s3_mocks/unstable_server.py b/tests/integration/test_storage_s3/s3_mocks/unstable_server.py index 3632fa15d8a..5ef781bdc9e 100644 --- a/tests/integration/test_storage_s3/s3_mocks/unstable_server.py +++ b/tests/integration/test_storage_s3/s3_mocks/unstable_server.py @@ -9,7 +9,7 @@ import time def gen_n_digit_number(n): assert 0 < n < 19 - return random.randint(10 ** (n - 1), 10 ** n - 1) + return random.randint(10 ** (n - 1), 10**n - 1) sum_in_4_column = 0 diff --git a/tests/integration/test_storage_s3/test.py b/tests/integration/test_storage_s3/test.py index e941356261a..2549cb0d473 100644 --- a/tests/integration/test_storage_s3/test.py +++ b/tests/integration/test_storage_s3/test.py @@ -553,13 +553,16 @@ def test_multipart(started_cluster, maybe_auth, positive): assert csv_data == get_s3_file_content(started_cluster, bucket, filename) # select uploaded data from many threads - select_query = "select sum(column1), sum(column2), sum(column3) " "from s3('http://{host}:{port}/{bucket}/{filename}', {auth}'CSV', '{table_format}')".format( - host=started_cluster.minio_redirect_host, - port=started_cluster.minio_redirect_port, - bucket=bucket, - filename=filename, - auth=maybe_auth, - table_format=table_format, + select_query = ( + "select sum(column1), sum(column2), sum(column3) " + "from s3('http://{host}:{port}/{bucket}/{filename}', {auth}'CSV', '{table_format}')".format( + host=started_cluster.minio_redirect_host, + port=started_cluster.minio_redirect_port, + bucket=bucket, + filename=filename, + auth=maybe_auth, + table_format=table_format, + ) ) try: select_result = run_query( diff --git a/tests/integration/test_storage_url/test.py b/tests/integration/test_storage_url/test.py index 771df49cbac..7ff7a871413 100644 --- a/tests/integration/test_storage_url/test.py +++ b/tests/integration/test_storage_url/test.py @@ -79,21 +79,15 @@ def test_table_function_url_access_rights(): f"SELECT * FROM url('http://nginx:80/test_1', 'TSV')", 
user="u1" ) - assert ( - node1.query( - f"DESCRIBE TABLE url('http://nginx:80/test_1', 'TSV', 'column1 UInt32, column2 UInt32, column3 UInt32')", - user="u1", - ) - == TSV([["column1", "UInt32"], ["column2", "UInt32"], ["column3", "UInt32"]]) - ) + assert node1.query( + f"DESCRIBE TABLE url('http://nginx:80/test_1', 'TSV', 'column1 UInt32, column2 UInt32, column3 UInt32')", + user="u1", + ) == TSV([["column1", "UInt32"], ["column2", "UInt32"], ["column3", "UInt32"]]) - assert ( - node1.query( - f"DESCRIBE TABLE url('http://nginx:80/not-exist', 'TSV', 'column1 UInt32, column2 UInt32, column3 UInt32')", - user="u1", - ) - == TSV([["column1", "UInt32"], ["column2", "UInt32"], ["column3", "UInt32"]]) - ) + assert node1.query( + f"DESCRIBE TABLE url('http://nginx:80/not-exist', 'TSV', 'column1 UInt32, column2 UInt32, column3 UInt32')", + user="u1", + ) == TSV([["column1", "UInt32"], ["column2", "UInt32"], ["column3", "UInt32"]]) expected_error = "necessary to have the grant URL ON *.*" assert expected_error in node1.query_and_get_error( diff --git a/tests/integration/test_system_merges/test.py b/tests/integration/test_system_merges/test.py index bacb0eb500d..6dbe6c891f2 100644 --- a/tests/integration/test_system_merges/test.py +++ b/tests/integration/test_system_merges/test.py @@ -204,33 +204,36 @@ def test_mutation_simple(started_cluster, replicated): sleep_time=0.1, ) - assert split_tsv( - node_check.query( - """ + assert ( + split_tsv( + node_check.query( + """ SELECT database, table, num_parts, source_part_names, source_part_paths, result_part_name, result_part_path, partition_id, is_mutation FROM system.merges WHERE table = '{name}' """.format( - name=table_name + name=table_name + ) ) ) - ) == [ - [ - db_name, - table_name, - "1", - "['{}']".format(part), - "['{clickhouse}/{table_path}/{}/']".format( - part, clickhouse=clickhouse_path, table_path=table_path - ), - result_part, - "{clickhouse}/{table_path}/{}/".format( - result_part, clickhouse=clickhouse_path, table_path=table_path - ), - "all", - "1", - ], - ] + == [ + [ + db_name, + table_name, + "1", + "['{}']".format(part), + "['{clickhouse}/{table_path}/{}/']".format( + part, clickhouse=clickhouse_path, table_path=table_path + ), + result_part, + "{clickhouse}/{table_path}/{}/".format( + result_part, clickhouse=clickhouse_path, table_path=table_path + ), + "all", + "1", + ], + ] + ) t.join() assert ( diff --git a/utils/grpc-client/pb2/clickhouse_grpc_pb2.py b/utils/grpc-client/pb2/clickhouse_grpc_pb2.py index 9bf7817c7d3..6218047af3c 100644 --- a/utils/grpc-client/pb2/clickhouse_grpc_pb2.py +++ b/utils/grpc-client/pb2/clickhouse_grpc_pb2.py @@ -8,17 +8,16 @@ from google.protobuf import descriptor_pool as _descriptor_pool from google.protobuf import message as _message from google.protobuf import reflection as _reflection from google.protobuf import symbol_database as _symbol_database - # @@protoc_insertion_point(imports) _sym_db = _symbol_database.Default() -DESCRIPTOR = _descriptor_pool.Default().AddSerializedFile( - b'\n\x15\x63lickhouse_grpc.proto\x12\x0f\x63lickhouse.grpc")\n\x0bNameAndType\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0c\n\x04type\x18\x02 \x01(\t"\xf5\x01\n\rExternalTable\x12\x0c\n\x04name\x18\x01 \x01(\t\x12-\n\x07\x63olumns\x18\x02 \x03(\x0b\x32\x1c.clickhouse.grpc.NameAndType\x12\x0c\n\x04\x64\x61ta\x18\x03 \x01(\x0c\x12\x0e\n\x06\x66ormat\x18\x04 \x01(\t\x12\x18\n\x10\x63ompression_type\x18\x06 \x01(\t\x12>\n\x08settings\x18\x05 
\x03(\x0b\x32,.clickhouse.grpc.ExternalTable.SettingsEntry\x1a/\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01"\x85\x03\n\x1cObsoleteTransportCompression\x12U\n\talgorithm\x18\x01 \x01(\x0e\x32\x42.clickhouse.grpc.ObsoleteTransportCompression.CompressionAlgorithm\x12M\n\x05level\x18\x02 \x01(\x0e\x32>.clickhouse.grpc.ObsoleteTransportCompression.CompressionLevel"R\n\x14\x43ompressionAlgorithm\x12\x12\n\x0eNO_COMPRESSION\x10\x00\x12\x0b\n\x07\x44\x45\x46LATE\x10\x01\x12\x08\n\x04GZIP\x10\x02\x12\x0f\n\x0bSTREAM_GZIP\x10\x03"k\n\x10\x43ompressionLevel\x12\x14\n\x10\x43OMPRESSION_NONE\x10\x00\x12\x13\n\x0f\x43OMPRESSION_LOW\x10\x01\x12\x16\n\x12\x43OMPRESSION_MEDIUM\x10\x02\x12\x14\n\x10\x43OMPRESSION_HIGH\x10\x03"\x8e\x06\n\tQueryInfo\x12\r\n\x05query\x18\x01 \x01(\t\x12\x10\n\x08query_id\x18\x02 \x01(\t\x12:\n\x08settings\x18\x03 \x03(\x0b\x32(.clickhouse.grpc.QueryInfo.SettingsEntry\x12\x10\n\x08\x64\x61tabase\x18\x04 \x01(\t\x12\x12\n\ninput_data\x18\x05 \x01(\x0c\x12\x1c\n\x14input_data_delimiter\x18\x06 \x01(\x0c\x12\x15\n\routput_format\x18\x07 \x01(\t\x12\x1b\n\x13send_output_columns\x18\x18 \x01(\x08\x12\x37\n\x0f\x65xternal_tables\x18\x08 \x03(\x0b\x32\x1e.clickhouse.grpc.ExternalTable\x12\x11\n\tuser_name\x18\t \x01(\t\x12\x10\n\x08password\x18\n \x01(\t\x12\r\n\x05quota\x18\x0b \x01(\t\x12\x12\n\nsession_id\x18\x0c \x01(\t\x12\x15\n\rsession_check\x18\r \x01(\x08\x12\x17\n\x0fsession_timeout\x18\x0e \x01(\r\x12\x0e\n\x06\x63\x61ncel\x18\x0f \x01(\x08\x12\x17\n\x0fnext_query_info\x18\x10 \x01(\x08\x12\x1e\n\x16input_compression_type\x18\x14 \x01(\t\x12\x1f\n\x17output_compression_type\x18\x15 \x01(\t\x12 \n\x18output_compression_level\x18\x13 \x01(\x05\x12"\n\x1atransport_compression_type\x18\x16 \x01(\t\x12#\n\x1btransport_compression_level\x18\x17 \x01(\x05\x12R\n\x1bobsolete_result_compression\x18\x11 \x01(\x0b\x32-.clickhouse.grpc.ObsoleteTransportCompression\x12!\n\x19obsolete_compression_type\x18\x12 \x01(\t\x1a/\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01"\xa1\x01\n\x08LogEntry\x12\x0c\n\x04time\x18\x01 \x01(\r\x12\x19\n\x11time_microseconds\x18\x02 \x01(\r\x12\x11\n\tthread_id\x18\x03 \x01(\x04\x12\x10\n\x08query_id\x18\x04 \x01(\t\x12)\n\x05level\x18\x05 \x01(\x0e\x32\x1a.clickhouse.grpc.LogsLevel\x12\x0e\n\x06source\x18\x06 \x01(\t\x12\x0c\n\x04text\x18\x07 \x01(\t"z\n\x08Progress\x12\x11\n\tread_rows\x18\x01 \x01(\x04\x12\x12\n\nread_bytes\x18\x02 \x01(\x04\x12\x1a\n\x12total_rows_to_read\x18\x03 \x01(\x04\x12\x14\n\x0cwritten_rows\x18\x04 \x01(\x04\x12\x15\n\rwritten_bytes\x18\x05 \x01(\x04"p\n\x05Stats\x12\x0c\n\x04rows\x18\x01 \x01(\x04\x12\x0e\n\x06\x62locks\x18\x02 \x01(\x04\x12\x17\n\x0f\x61llocated_bytes\x18\x03 \x01(\x04\x12\x15\n\rapplied_limit\x18\x04 \x01(\x08\x12\x19\n\x11rows_before_limit\x18\x05 \x01(\x04"R\n\tException\x12\x0c\n\x04\x63ode\x18\x01 \x01(\x05\x12\x0c\n\x04name\x18\x02 \x01(\t\x12\x14\n\x0c\x64isplay_text\x18\x03 \x01(\t\x12\x13\n\x0bstack_trace\x18\x04 \x01(\t"\xeb\x02\n\x06Result\x12\x10\n\x08query_id\x18\t \x01(\t\x12\x11\n\ttime_zone\x18\n \x01(\t\x12\x15\n\routput_format\x18\x0b \x01(\t\x12\x34\n\x0eoutput_columns\x18\x0c \x03(\x0b\x32\x1c.clickhouse.grpc.NameAndType\x12\x0e\n\x06output\x18\x01 \x01(\x0c\x12\x0e\n\x06totals\x18\x02 \x01(\x0c\x12\x10\n\x08\x65xtremes\x18\x03 \x01(\x0c\x12\'\n\x04logs\x18\x04 \x03(\x0b\x32\x19.clickhouse.grpc.LogEntry\x12+\n\x08progress\x18\x05 
\x01(\x0b\x32\x19.clickhouse.grpc.Progress\x12%\n\x05stats\x18\x06 \x01(\x0b\x32\x16.clickhouse.grpc.Stats\x12-\n\texception\x18\x07 \x01(\x0b\x32\x1a.clickhouse.grpc.Exception\x12\x11\n\tcancelled\x18\x08 \x01(\x08*\x9d\x01\n\tLogsLevel\x12\x0c\n\x08LOG_NONE\x10\x00\x12\r\n\tLOG_FATAL\x10\x01\x12\x10\n\x0cLOG_CRITICAL\x10\x02\x12\r\n\tLOG_ERROR\x10\x03\x12\x0f\n\x0bLOG_WARNING\x10\x04\x12\x0e\n\nLOG_NOTICE\x10\x05\x12\x13\n\x0fLOG_INFORMATION\x10\x06\x12\r\n\tLOG_DEBUG\x10\x07\x12\r\n\tLOG_TRACE\x10\x08\x32\xdb\x02\n\nClickHouse\x12\x45\n\x0c\x45xecuteQuery\x12\x1a.clickhouse.grpc.QueryInfo\x1a\x17.clickhouse.grpc.Result"\x00\x12V\n\x1b\x45xecuteQueryWithStreamInput\x12\x1a.clickhouse.grpc.QueryInfo\x1a\x17.clickhouse.grpc.Result"\x00(\x01\x12W\n\x1c\x45xecuteQueryWithStreamOutput\x12\x1a.clickhouse.grpc.QueryInfo\x1a\x17.clickhouse.grpc.Result"\x00\x30\x01\x12U\n\x18\x45xecuteQueryWithStreamIO\x12\x1a.clickhouse.grpc.QueryInfo\x1a\x17.clickhouse.grpc.Result"\x00(\x01\x30\x01\x62\x06proto3' -) -_LOGSLEVEL = DESCRIPTOR.enum_types_by_name["LogsLevel"] + +DESCRIPTOR = _descriptor_pool.Default().AddSerializedFile(b'\n\x15\x63lickhouse_grpc.proto\x12\x0f\x63lickhouse.grpc\")\n\x0bNameAndType\x12\x0c\n\x04name\x18\x01 \x01(\t\x12\x0c\n\x04type\x18\x02 \x01(\t\"\xf5\x01\n\rExternalTable\x12\x0c\n\x04name\x18\x01 \x01(\t\x12-\n\x07\x63olumns\x18\x02 \x03(\x0b\x32\x1c.clickhouse.grpc.NameAndType\x12\x0c\n\x04\x64\x61ta\x18\x03 \x01(\x0c\x12\x0e\n\x06\x66ormat\x18\x04 \x01(\t\x12\x18\n\x10\x63ompression_type\x18\x06 \x01(\t\x12>\n\x08settings\x18\x05 \x03(\x0b\x32,.clickhouse.grpc.ExternalTable.SettingsEntry\x1a/\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\"\x85\x03\n\x1cObsoleteTransportCompression\x12U\n\talgorithm\x18\x01 \x01(\x0e\x32\x42.clickhouse.grpc.ObsoleteTransportCompression.CompressionAlgorithm\x12M\n\x05level\x18\x02 \x01(\x0e\x32>.clickhouse.grpc.ObsoleteTransportCompression.CompressionLevel\"R\n\x14\x43ompressionAlgorithm\x12\x12\n\x0eNO_COMPRESSION\x10\x00\x12\x0b\n\x07\x44\x45\x46LATE\x10\x01\x12\x08\n\x04GZIP\x10\x02\x12\x0f\n\x0bSTREAM_GZIP\x10\x03\"k\n\x10\x43ompressionLevel\x12\x14\n\x10\x43OMPRESSION_NONE\x10\x00\x12\x13\n\x0f\x43OMPRESSION_LOW\x10\x01\x12\x16\n\x12\x43OMPRESSION_MEDIUM\x10\x02\x12\x14\n\x10\x43OMPRESSION_HIGH\x10\x03\"\x8e\x06\n\tQueryInfo\x12\r\n\x05query\x18\x01 \x01(\t\x12\x10\n\x08query_id\x18\x02 \x01(\t\x12:\n\x08settings\x18\x03 \x03(\x0b\x32(.clickhouse.grpc.QueryInfo.SettingsEntry\x12\x10\n\x08\x64\x61tabase\x18\x04 \x01(\t\x12\x12\n\ninput_data\x18\x05 \x01(\x0c\x12\x1c\n\x14input_data_delimiter\x18\x06 \x01(\x0c\x12\x15\n\routput_format\x18\x07 \x01(\t\x12\x1b\n\x13send_output_columns\x18\x18 \x01(\x08\x12\x37\n\x0f\x65xternal_tables\x18\x08 \x03(\x0b\x32\x1e.clickhouse.grpc.ExternalTable\x12\x11\n\tuser_name\x18\t \x01(\t\x12\x10\n\x08password\x18\n \x01(\t\x12\r\n\x05quota\x18\x0b \x01(\t\x12\x12\n\nsession_id\x18\x0c \x01(\t\x12\x15\n\rsession_check\x18\r \x01(\x08\x12\x17\n\x0fsession_timeout\x18\x0e \x01(\r\x12\x0e\n\x06\x63\x61ncel\x18\x0f \x01(\x08\x12\x17\n\x0fnext_query_info\x18\x10 \x01(\x08\x12\x1e\n\x16input_compression_type\x18\x14 \x01(\t\x12\x1f\n\x17output_compression_type\x18\x15 \x01(\t\x12 \n\x18output_compression_level\x18\x13 \x01(\x05\x12\"\n\x1atransport_compression_type\x18\x16 \x01(\t\x12#\n\x1btransport_compression_level\x18\x17 \x01(\x05\x12R\n\x1bobsolete_result_compression\x18\x11 
\x01(\x0b\x32-.clickhouse.grpc.ObsoleteTransportCompression\x12!\n\x19obsolete_compression_type\x18\x12 \x01(\t\x1a/\n\rSettingsEntry\x12\x0b\n\x03key\x18\x01 \x01(\t\x12\r\n\x05value\x18\x02 \x01(\t:\x02\x38\x01\"\xa1\x01\n\x08LogEntry\x12\x0c\n\x04time\x18\x01 \x01(\r\x12\x19\n\x11time_microseconds\x18\x02 \x01(\r\x12\x11\n\tthread_id\x18\x03 \x01(\x04\x12\x10\n\x08query_id\x18\x04 \x01(\t\x12)\n\x05level\x18\x05 \x01(\x0e\x32\x1a.clickhouse.grpc.LogsLevel\x12\x0e\n\x06source\x18\x06 \x01(\t\x12\x0c\n\x04text\x18\x07 \x01(\t\"z\n\x08Progress\x12\x11\n\tread_rows\x18\x01 \x01(\x04\x12\x12\n\nread_bytes\x18\x02 \x01(\x04\x12\x1a\n\x12total_rows_to_read\x18\x03 \x01(\x04\x12\x14\n\x0cwritten_rows\x18\x04 \x01(\x04\x12\x15\n\rwritten_bytes\x18\x05 \x01(\x04\"p\n\x05Stats\x12\x0c\n\x04rows\x18\x01 \x01(\x04\x12\x0e\n\x06\x62locks\x18\x02 \x01(\x04\x12\x17\n\x0f\x61llocated_bytes\x18\x03 \x01(\x04\x12\x15\n\rapplied_limit\x18\x04 \x01(\x08\x12\x19\n\x11rows_before_limit\x18\x05 \x01(\x04\"R\n\tException\x12\x0c\n\x04\x63ode\x18\x01 \x01(\x05\x12\x0c\n\x04name\x18\x02 \x01(\t\x12\x14\n\x0c\x64isplay_text\x18\x03 \x01(\t\x12\x13\n\x0bstack_trace\x18\x04 \x01(\t\"\xeb\x02\n\x06Result\x12\x10\n\x08query_id\x18\t \x01(\t\x12\x11\n\ttime_zone\x18\n \x01(\t\x12\x15\n\routput_format\x18\x0b \x01(\t\x12\x34\n\x0eoutput_columns\x18\x0c \x03(\x0b\x32\x1c.clickhouse.grpc.NameAndType\x12\x0e\n\x06output\x18\x01 \x01(\x0c\x12\x0e\n\x06totals\x18\x02 \x01(\x0c\x12\x10\n\x08\x65xtremes\x18\x03 \x01(\x0c\x12\'\n\x04logs\x18\x04 \x03(\x0b\x32\x19.clickhouse.grpc.LogEntry\x12+\n\x08progress\x18\x05 \x01(\x0b\x32\x19.clickhouse.grpc.Progress\x12%\n\x05stats\x18\x06 \x01(\x0b\x32\x16.clickhouse.grpc.Stats\x12-\n\texception\x18\x07 \x01(\x0b\x32\x1a.clickhouse.grpc.Exception\x12\x11\n\tcancelled\x18\x08 \x01(\x08*\x9d\x01\n\tLogsLevel\x12\x0c\n\x08LOG_NONE\x10\x00\x12\r\n\tLOG_FATAL\x10\x01\x12\x10\n\x0cLOG_CRITICAL\x10\x02\x12\r\n\tLOG_ERROR\x10\x03\x12\x0f\n\x0bLOG_WARNING\x10\x04\x12\x0e\n\nLOG_NOTICE\x10\x05\x12\x13\n\x0fLOG_INFORMATION\x10\x06\x12\r\n\tLOG_DEBUG\x10\x07\x12\r\n\tLOG_TRACE\x10\x08\x32\xdb\x02\n\nClickHouse\x12\x45\n\x0c\x45xecuteQuery\x12\x1a.clickhouse.grpc.QueryInfo\x1a\x17.clickhouse.grpc.Result\"\x00\x12V\n\x1b\x45xecuteQueryWithStreamInput\x12\x1a.clickhouse.grpc.QueryInfo\x1a\x17.clickhouse.grpc.Result\"\x00(\x01\x12W\n\x1c\x45xecuteQueryWithStreamOutput\x12\x1a.clickhouse.grpc.QueryInfo\x1a\x17.clickhouse.grpc.Result\"\x00\x30\x01\x12U\n\x18\x45xecuteQueryWithStreamIO\x12\x1a.clickhouse.grpc.QueryInfo\x1a\x17.clickhouse.grpc.Result\"\x00(\x01\x30\x01\x62\x06proto3') + +_LOGSLEVEL = DESCRIPTOR.enum_types_by_name['LogsLevel'] LogsLevel = enum_type_wrapper.EnumTypeWrapper(_LOGSLEVEL) LOG_NONE = 0 LOG_FATAL = 1 @@ -31,180 +30,134 @@ LOG_DEBUG = 7 LOG_TRACE = 8 -_NAMEANDTYPE = DESCRIPTOR.message_types_by_name["NameAndType"] -_EXTERNALTABLE = DESCRIPTOR.message_types_by_name["ExternalTable"] -_EXTERNALTABLE_SETTINGSENTRY = _EXTERNALTABLE.nested_types_by_name["SettingsEntry"] -_OBSOLETETRANSPORTCOMPRESSION = DESCRIPTOR.message_types_by_name[ - "ObsoleteTransportCompression" -] -_QUERYINFO = DESCRIPTOR.message_types_by_name["QueryInfo"] -_QUERYINFO_SETTINGSENTRY = _QUERYINFO.nested_types_by_name["SettingsEntry"] -_LOGENTRY = DESCRIPTOR.message_types_by_name["LogEntry"] -_PROGRESS = DESCRIPTOR.message_types_by_name["Progress"] -_STATS = DESCRIPTOR.message_types_by_name["Stats"] -_EXCEPTION = DESCRIPTOR.message_types_by_name["Exception"] -_RESULT = DESCRIPTOR.message_types_by_name["Result"] 
-_OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONALGORITHM = ( - _OBSOLETETRANSPORTCOMPRESSION.enum_types_by_name["CompressionAlgorithm"] -) -_OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONLEVEL = ( - _OBSOLETETRANSPORTCOMPRESSION.enum_types_by_name["CompressionLevel"] -) -NameAndType = _reflection.GeneratedProtocolMessageType( - "NameAndType", - (_message.Message,), - { - "DESCRIPTOR": _NAMEANDTYPE, - "__module__": "clickhouse_grpc_pb2" - # @@protoc_insertion_point(class_scope:clickhouse.grpc.NameAndType) - }, -) +_NAMEANDTYPE = DESCRIPTOR.message_types_by_name['NameAndType'] +_EXTERNALTABLE = DESCRIPTOR.message_types_by_name['ExternalTable'] +_EXTERNALTABLE_SETTINGSENTRY = _EXTERNALTABLE.nested_types_by_name['SettingsEntry'] +_OBSOLETETRANSPORTCOMPRESSION = DESCRIPTOR.message_types_by_name['ObsoleteTransportCompression'] +_QUERYINFO = DESCRIPTOR.message_types_by_name['QueryInfo'] +_QUERYINFO_SETTINGSENTRY = _QUERYINFO.nested_types_by_name['SettingsEntry'] +_LOGENTRY = DESCRIPTOR.message_types_by_name['LogEntry'] +_PROGRESS = DESCRIPTOR.message_types_by_name['Progress'] +_STATS = DESCRIPTOR.message_types_by_name['Stats'] +_EXCEPTION = DESCRIPTOR.message_types_by_name['Exception'] +_RESULT = DESCRIPTOR.message_types_by_name['Result'] +_OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONALGORITHM = _OBSOLETETRANSPORTCOMPRESSION.enum_types_by_name['CompressionAlgorithm'] +_OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONLEVEL = _OBSOLETETRANSPORTCOMPRESSION.enum_types_by_name['CompressionLevel'] +NameAndType = _reflection.GeneratedProtocolMessageType('NameAndType', (_message.Message,), { + 'DESCRIPTOR' : _NAMEANDTYPE, + '__module__' : 'clickhouse_grpc_pb2' + # @@protoc_insertion_point(class_scope:clickhouse.grpc.NameAndType) + }) _sym_db.RegisterMessage(NameAndType) -ExternalTable = _reflection.GeneratedProtocolMessageType( - "ExternalTable", - (_message.Message,), - { - "SettingsEntry": _reflection.GeneratedProtocolMessageType( - "SettingsEntry", - (_message.Message,), - { - "DESCRIPTOR": _EXTERNALTABLE_SETTINGSENTRY, - "__module__": "clickhouse_grpc_pb2" - # @@protoc_insertion_point(class_scope:clickhouse.grpc.ExternalTable.SettingsEntry) - }, - ), - "DESCRIPTOR": _EXTERNALTABLE, - "__module__": "clickhouse_grpc_pb2" - # @@protoc_insertion_point(class_scope:clickhouse.grpc.ExternalTable) - }, -) +ExternalTable = _reflection.GeneratedProtocolMessageType('ExternalTable', (_message.Message,), { + + 'SettingsEntry' : _reflection.GeneratedProtocolMessageType('SettingsEntry', (_message.Message,), { + 'DESCRIPTOR' : _EXTERNALTABLE_SETTINGSENTRY, + '__module__' : 'clickhouse_grpc_pb2' + # @@protoc_insertion_point(class_scope:clickhouse.grpc.ExternalTable.SettingsEntry) + }) + , + 'DESCRIPTOR' : _EXTERNALTABLE, + '__module__' : 'clickhouse_grpc_pb2' + # @@protoc_insertion_point(class_scope:clickhouse.grpc.ExternalTable) + }) _sym_db.RegisterMessage(ExternalTable) _sym_db.RegisterMessage(ExternalTable.SettingsEntry) -ObsoleteTransportCompression = _reflection.GeneratedProtocolMessageType( - "ObsoleteTransportCompression", - (_message.Message,), - { - "DESCRIPTOR": _OBSOLETETRANSPORTCOMPRESSION, - "__module__": "clickhouse_grpc_pb2" - # @@protoc_insertion_point(class_scope:clickhouse.grpc.ObsoleteTransportCompression) - }, -) +ObsoleteTransportCompression = _reflection.GeneratedProtocolMessageType('ObsoleteTransportCompression', (_message.Message,), { + 'DESCRIPTOR' : _OBSOLETETRANSPORTCOMPRESSION, + '__module__' : 'clickhouse_grpc_pb2' + # @@protoc_insertion_point(class_scope:clickhouse.grpc.ObsoleteTransportCompression) + }) 
_sym_db.RegisterMessage(ObsoleteTransportCompression) -QueryInfo = _reflection.GeneratedProtocolMessageType( - "QueryInfo", - (_message.Message,), - { - "SettingsEntry": _reflection.GeneratedProtocolMessageType( - "SettingsEntry", - (_message.Message,), - { - "DESCRIPTOR": _QUERYINFO_SETTINGSENTRY, - "__module__": "clickhouse_grpc_pb2" - # @@protoc_insertion_point(class_scope:clickhouse.grpc.QueryInfo.SettingsEntry) - }, - ), - "DESCRIPTOR": _QUERYINFO, - "__module__": "clickhouse_grpc_pb2" - # @@protoc_insertion_point(class_scope:clickhouse.grpc.QueryInfo) - }, -) +QueryInfo = _reflection.GeneratedProtocolMessageType('QueryInfo', (_message.Message,), { + + 'SettingsEntry' : _reflection.GeneratedProtocolMessageType('SettingsEntry', (_message.Message,), { + 'DESCRIPTOR' : _QUERYINFO_SETTINGSENTRY, + '__module__' : 'clickhouse_grpc_pb2' + # @@protoc_insertion_point(class_scope:clickhouse.grpc.QueryInfo.SettingsEntry) + }) + , + 'DESCRIPTOR' : _QUERYINFO, + '__module__' : 'clickhouse_grpc_pb2' + # @@protoc_insertion_point(class_scope:clickhouse.grpc.QueryInfo) + }) _sym_db.RegisterMessage(QueryInfo) _sym_db.RegisterMessage(QueryInfo.SettingsEntry) -LogEntry = _reflection.GeneratedProtocolMessageType( - "LogEntry", - (_message.Message,), - { - "DESCRIPTOR": _LOGENTRY, - "__module__": "clickhouse_grpc_pb2" - # @@protoc_insertion_point(class_scope:clickhouse.grpc.LogEntry) - }, -) +LogEntry = _reflection.GeneratedProtocolMessageType('LogEntry', (_message.Message,), { + 'DESCRIPTOR' : _LOGENTRY, + '__module__' : 'clickhouse_grpc_pb2' + # @@protoc_insertion_point(class_scope:clickhouse.grpc.LogEntry) + }) _sym_db.RegisterMessage(LogEntry) -Progress = _reflection.GeneratedProtocolMessageType( - "Progress", - (_message.Message,), - { - "DESCRIPTOR": _PROGRESS, - "__module__": "clickhouse_grpc_pb2" - # @@protoc_insertion_point(class_scope:clickhouse.grpc.Progress) - }, -) +Progress = _reflection.GeneratedProtocolMessageType('Progress', (_message.Message,), { + 'DESCRIPTOR' : _PROGRESS, + '__module__' : 'clickhouse_grpc_pb2' + # @@protoc_insertion_point(class_scope:clickhouse.grpc.Progress) + }) _sym_db.RegisterMessage(Progress) -Stats = _reflection.GeneratedProtocolMessageType( - "Stats", - (_message.Message,), - { - "DESCRIPTOR": _STATS, - "__module__": "clickhouse_grpc_pb2" - # @@protoc_insertion_point(class_scope:clickhouse.grpc.Stats) - }, -) +Stats = _reflection.GeneratedProtocolMessageType('Stats', (_message.Message,), { + 'DESCRIPTOR' : _STATS, + '__module__' : 'clickhouse_grpc_pb2' + # @@protoc_insertion_point(class_scope:clickhouse.grpc.Stats) + }) _sym_db.RegisterMessage(Stats) -Exception = _reflection.GeneratedProtocolMessageType( - "Exception", - (_message.Message,), - { - "DESCRIPTOR": _EXCEPTION, - "__module__": "clickhouse_grpc_pb2" - # @@protoc_insertion_point(class_scope:clickhouse.grpc.Exception) - }, -) +Exception = _reflection.GeneratedProtocolMessageType('Exception', (_message.Message,), { + 'DESCRIPTOR' : _EXCEPTION, + '__module__' : 'clickhouse_grpc_pb2' + # @@protoc_insertion_point(class_scope:clickhouse.grpc.Exception) + }) _sym_db.RegisterMessage(Exception) -Result = _reflection.GeneratedProtocolMessageType( - "Result", - (_message.Message,), - { - "DESCRIPTOR": _RESULT, - "__module__": "clickhouse_grpc_pb2" - # @@protoc_insertion_point(class_scope:clickhouse.grpc.Result) - }, -) +Result = _reflection.GeneratedProtocolMessageType('Result', (_message.Message,), { + 'DESCRIPTOR' : _RESULT, + '__module__' : 'clickhouse_grpc_pb2' + # 
@@protoc_insertion_point(class_scope:clickhouse.grpc.Result) + }) _sym_db.RegisterMessage(Result) -_CLICKHOUSE = DESCRIPTOR.services_by_name["ClickHouse"] +_CLICKHOUSE = DESCRIPTOR.services_by_name['ClickHouse'] if _descriptor._USE_C_DESCRIPTORS == False: - DESCRIPTOR._options = None - _EXTERNALTABLE_SETTINGSENTRY._options = None - _EXTERNALTABLE_SETTINGSENTRY._serialized_options = b"8\001" - _QUERYINFO_SETTINGSENTRY._options = None - _QUERYINFO_SETTINGSENTRY._serialized_options = b"8\001" - _LOGSLEVEL._serialized_start = 2363 - _LOGSLEVEL._serialized_end = 2520 - _NAMEANDTYPE._serialized_start = 42 - _NAMEANDTYPE._serialized_end = 83 - _EXTERNALTABLE._serialized_start = 86 - _EXTERNALTABLE._serialized_end = 331 - _EXTERNALTABLE_SETTINGSENTRY._serialized_start = 284 - _EXTERNALTABLE_SETTINGSENTRY._serialized_end = 331 - _OBSOLETETRANSPORTCOMPRESSION._serialized_start = 334 - _OBSOLETETRANSPORTCOMPRESSION._serialized_end = 723 - _OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONALGORITHM._serialized_start = 532 - _OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONALGORITHM._serialized_end = 614 - _OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONLEVEL._serialized_start = 616 - _OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONLEVEL._serialized_end = 723 - _QUERYINFO._serialized_start = 726 - _QUERYINFO._serialized_end = 1508 - _QUERYINFO_SETTINGSENTRY._serialized_start = 284 - _QUERYINFO_SETTINGSENTRY._serialized_end = 331 - _LOGENTRY._serialized_start = 1511 - _LOGENTRY._serialized_end = 1672 - _PROGRESS._serialized_start = 1674 - _PROGRESS._serialized_end = 1796 - _STATS._serialized_start = 1798 - _STATS._serialized_end = 1910 - _EXCEPTION._serialized_start = 1912 - _EXCEPTION._serialized_end = 1994 - _RESULT._serialized_start = 1997 - _RESULT._serialized_end = 2360 - _CLICKHOUSE._serialized_start = 2523 - _CLICKHOUSE._serialized_end = 2870 + DESCRIPTOR._options = None + _EXTERNALTABLE_SETTINGSENTRY._options = None + _EXTERNALTABLE_SETTINGSENTRY._serialized_options = b'8\001' + _QUERYINFO_SETTINGSENTRY._options = None + _QUERYINFO_SETTINGSENTRY._serialized_options = b'8\001' + _LOGSLEVEL._serialized_start=2363 + _LOGSLEVEL._serialized_end=2520 + _NAMEANDTYPE._serialized_start=42 + _NAMEANDTYPE._serialized_end=83 + _EXTERNALTABLE._serialized_start=86 + _EXTERNALTABLE._serialized_end=331 + _EXTERNALTABLE_SETTINGSENTRY._serialized_start=284 + _EXTERNALTABLE_SETTINGSENTRY._serialized_end=331 + _OBSOLETETRANSPORTCOMPRESSION._serialized_start=334 + _OBSOLETETRANSPORTCOMPRESSION._serialized_end=723 + _OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONALGORITHM._serialized_start=532 + _OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONALGORITHM._serialized_end=614 + _OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONLEVEL._serialized_start=616 + _OBSOLETETRANSPORTCOMPRESSION_COMPRESSIONLEVEL._serialized_end=723 + _QUERYINFO._serialized_start=726 + _QUERYINFO._serialized_end=1508 + _QUERYINFO_SETTINGSENTRY._serialized_start=284 + _QUERYINFO_SETTINGSENTRY._serialized_end=331 + _LOGENTRY._serialized_start=1511 + _LOGENTRY._serialized_end=1672 + _PROGRESS._serialized_start=1674 + _PROGRESS._serialized_end=1796 + _STATS._serialized_start=1798 + _STATS._serialized_end=1910 + _EXCEPTION._serialized_start=1912 + _EXCEPTION._serialized_end=1994 + _RESULT._serialized_start=1997 + _RESULT._serialized_end=2360 + _CLICKHOUSE._serialized_start=2523 + _CLICKHOUSE._serialized_end=2870 # @@protoc_insertion_point(module_scope) diff --git a/utils/grpc-client/pb2/clickhouse_grpc_pb2_grpc.py b/utils/grpc-client/pb2/clickhouse_grpc_pb2_grpc.py index 25643a243b3..1c71218bbe5 100644 
--- a/utils/grpc-client/pb2/clickhouse_grpc_pb2_grpc.py +++ b/utils/grpc-client/pb2/clickhouse_grpc_pb2_grpc.py @@ -15,25 +15,25 @@ class ClickHouseStub(object): channel: A grpc.Channel. """ self.ExecuteQuery = channel.unary_unary( - "/clickhouse.grpc.ClickHouse/ExecuteQuery", - request_serializer=clickhouse__grpc__pb2.QueryInfo.SerializeToString, - response_deserializer=clickhouse__grpc__pb2.Result.FromString, - ) + '/clickhouse.grpc.ClickHouse/ExecuteQuery', + request_serializer=clickhouse__grpc__pb2.QueryInfo.SerializeToString, + response_deserializer=clickhouse__grpc__pb2.Result.FromString, + ) self.ExecuteQueryWithStreamInput = channel.stream_unary( - "/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamInput", - request_serializer=clickhouse__grpc__pb2.QueryInfo.SerializeToString, - response_deserializer=clickhouse__grpc__pb2.Result.FromString, - ) + '/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamInput', + request_serializer=clickhouse__grpc__pb2.QueryInfo.SerializeToString, + response_deserializer=clickhouse__grpc__pb2.Result.FromString, + ) self.ExecuteQueryWithStreamOutput = channel.unary_stream( - "/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamOutput", - request_serializer=clickhouse__grpc__pb2.QueryInfo.SerializeToString, - response_deserializer=clickhouse__grpc__pb2.Result.FromString, - ) + '/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamOutput', + request_serializer=clickhouse__grpc__pb2.QueryInfo.SerializeToString, + response_deserializer=clickhouse__grpc__pb2.Result.FromString, + ) self.ExecuteQueryWithStreamIO = channel.stream_stream( - "/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamIO", - request_serializer=clickhouse__grpc__pb2.QueryInfo.SerializeToString, - response_deserializer=clickhouse__grpc__pb2.Result.FromString, - ) + '/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamIO', + request_serializer=clickhouse__grpc__pb2.QueryInfo.SerializeToString, + response_deserializer=clickhouse__grpc__pb2.Result.FromString, + ) class ClickHouseServicer(object): @@ -42,173 +42,124 @@ class ClickHouseServicer(object): def ExecuteQuery(self, request, context): """Missing associated documentation comment in .proto file.""" context.set_code(grpc.StatusCode.UNIMPLEMENTED) - context.set_details("Method not implemented!") - raise NotImplementedError("Method not implemented!") + context.set_details('Method not implemented!') + raise NotImplementedError('Method not implemented!') def ExecuteQueryWithStreamInput(self, request_iterator, context): """Missing associated documentation comment in .proto file.""" context.set_code(grpc.StatusCode.UNIMPLEMENTED) - context.set_details("Method not implemented!") - raise NotImplementedError("Method not implemented!") + context.set_details('Method not implemented!') + raise NotImplementedError('Method not implemented!') def ExecuteQueryWithStreamOutput(self, request, context): """Missing associated documentation comment in .proto file.""" context.set_code(grpc.StatusCode.UNIMPLEMENTED) - context.set_details("Method not implemented!") - raise NotImplementedError("Method not implemented!") + context.set_details('Method not implemented!') + raise NotImplementedError('Method not implemented!') def ExecuteQueryWithStreamIO(self, request_iterator, context): """Missing associated documentation comment in .proto file.""" context.set_code(grpc.StatusCode.UNIMPLEMENTED) - context.set_details("Method not implemented!") - raise NotImplementedError("Method not implemented!") + context.set_details('Method not implemented!') + raise 
NotImplementedError('Method not implemented!') def add_ClickHouseServicer_to_server(servicer, server): rpc_method_handlers = { - "ExecuteQuery": grpc.unary_unary_rpc_method_handler( - servicer.ExecuteQuery, - request_deserializer=clickhouse__grpc__pb2.QueryInfo.FromString, - response_serializer=clickhouse__grpc__pb2.Result.SerializeToString, - ), - "ExecuteQueryWithStreamInput": grpc.stream_unary_rpc_method_handler( - servicer.ExecuteQueryWithStreamInput, - request_deserializer=clickhouse__grpc__pb2.QueryInfo.FromString, - response_serializer=clickhouse__grpc__pb2.Result.SerializeToString, - ), - "ExecuteQueryWithStreamOutput": grpc.unary_stream_rpc_method_handler( - servicer.ExecuteQueryWithStreamOutput, - request_deserializer=clickhouse__grpc__pb2.QueryInfo.FromString, - response_serializer=clickhouse__grpc__pb2.Result.SerializeToString, - ), - "ExecuteQueryWithStreamIO": grpc.stream_stream_rpc_method_handler( - servicer.ExecuteQueryWithStreamIO, - request_deserializer=clickhouse__grpc__pb2.QueryInfo.FromString, - response_serializer=clickhouse__grpc__pb2.Result.SerializeToString, - ), + 'ExecuteQuery': grpc.unary_unary_rpc_method_handler( + servicer.ExecuteQuery, + request_deserializer=clickhouse__grpc__pb2.QueryInfo.FromString, + response_serializer=clickhouse__grpc__pb2.Result.SerializeToString, + ), + 'ExecuteQueryWithStreamInput': grpc.stream_unary_rpc_method_handler( + servicer.ExecuteQueryWithStreamInput, + request_deserializer=clickhouse__grpc__pb2.QueryInfo.FromString, + response_serializer=clickhouse__grpc__pb2.Result.SerializeToString, + ), + 'ExecuteQueryWithStreamOutput': grpc.unary_stream_rpc_method_handler( + servicer.ExecuteQueryWithStreamOutput, + request_deserializer=clickhouse__grpc__pb2.QueryInfo.FromString, + response_serializer=clickhouse__grpc__pb2.Result.SerializeToString, + ), + 'ExecuteQueryWithStreamIO': grpc.stream_stream_rpc_method_handler( + servicer.ExecuteQueryWithStreamIO, + request_deserializer=clickhouse__grpc__pb2.QueryInfo.FromString, + response_serializer=clickhouse__grpc__pb2.Result.SerializeToString, + ), } generic_handler = grpc.method_handlers_generic_handler( - "clickhouse.grpc.ClickHouse", rpc_method_handlers - ) + 'clickhouse.grpc.ClickHouse', rpc_method_handlers) server.add_generic_rpc_handlers((generic_handler,)) -# This class is part of an EXPERIMENTAL API. + # This class is part of an EXPERIMENTAL API. 
class ClickHouse(object): """Missing associated documentation comment in .proto file.""" @staticmethod - def ExecuteQuery( - request, - target, - options=(), - channel_credentials=None, - call_credentials=None, - insecure=False, - compression=None, - wait_for_ready=None, - timeout=None, - metadata=None, - ): - return grpc.experimental.unary_unary( - request, + def ExecuteQuery(request, target, - "/clickhouse.grpc.ClickHouse/ExecuteQuery", + options=(), + channel_credentials=None, + call_credentials=None, + insecure=False, + compression=None, + wait_for_ready=None, + timeout=None, + metadata=None): + return grpc.experimental.unary_unary(request, target, '/clickhouse.grpc.ClickHouse/ExecuteQuery', clickhouse__grpc__pb2.QueryInfo.SerializeToString, clickhouse__grpc__pb2.Result.FromString, - options, - channel_credentials, - insecure, - call_credentials, - compression, - wait_for_ready, - timeout, - metadata, - ) + options, channel_credentials, + insecure, call_credentials, compression, wait_for_ready, timeout, metadata) @staticmethod - def ExecuteQueryWithStreamInput( - request_iterator, - target, - options=(), - channel_credentials=None, - call_credentials=None, - insecure=False, - compression=None, - wait_for_ready=None, - timeout=None, - metadata=None, - ): - return grpc.experimental.stream_unary( - request_iterator, + def ExecuteQueryWithStreamInput(request_iterator, target, - "/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamInput", + options=(), + channel_credentials=None, + call_credentials=None, + insecure=False, + compression=None, + wait_for_ready=None, + timeout=None, + metadata=None): + return grpc.experimental.stream_unary(request_iterator, target, '/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamInput', clickhouse__grpc__pb2.QueryInfo.SerializeToString, clickhouse__grpc__pb2.Result.FromString, - options, - channel_credentials, - insecure, - call_credentials, - compression, - wait_for_ready, - timeout, - metadata, - ) + options, channel_credentials, + insecure, call_credentials, compression, wait_for_ready, timeout, metadata) @staticmethod - def ExecuteQueryWithStreamOutput( - request, - target, - options=(), - channel_credentials=None, - call_credentials=None, - insecure=False, - compression=None, - wait_for_ready=None, - timeout=None, - metadata=None, - ): - return grpc.experimental.unary_stream( - request, + def ExecuteQueryWithStreamOutput(request, target, - "/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamOutput", + options=(), + channel_credentials=None, + call_credentials=None, + insecure=False, + compression=None, + wait_for_ready=None, + timeout=None, + metadata=None): + return grpc.experimental.unary_stream(request, target, '/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamOutput', clickhouse__grpc__pb2.QueryInfo.SerializeToString, clickhouse__grpc__pb2.Result.FromString, - options, - channel_credentials, - insecure, - call_credentials, - compression, - wait_for_ready, - timeout, - metadata, - ) + options, channel_credentials, + insecure, call_credentials, compression, wait_for_ready, timeout, metadata) @staticmethod - def ExecuteQueryWithStreamIO( - request_iterator, - target, - options=(), - channel_credentials=None, - call_credentials=None, - insecure=False, - compression=None, - wait_for_ready=None, - timeout=None, - metadata=None, - ): - return grpc.experimental.stream_stream( - request_iterator, + def ExecuteQueryWithStreamIO(request_iterator, target, - "/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamIO", + options=(), + channel_credentials=None, + 
call_credentials=None, + insecure=False, + compression=None, + wait_for_ready=None, + timeout=None, + metadata=None): + return grpc.experimental.stream_stream(request_iterator, target, '/clickhouse.grpc.ClickHouse/ExecuteQueryWithStreamIO', clickhouse__grpc__pb2.QueryInfo.SerializeToString, clickhouse__grpc__pb2.Result.FromString, - options, - channel_credentials, - insecure, - call_credentials, - compression, - wait_for_ready, - timeout, - metadata, - ) + options, channel_credentials, + insecure, call_credentials, compression, wait_for_ready, timeout, metadata) From 5cda358e62c90a2345a60a249b6d7e8430f6454d Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 06:26:04 +0100 Subject: [PATCH 0142/1081] Obey Python's quirky formatter --- tests/clickhouse-test | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/tests/clickhouse-test b/tests/clickhouse-test index bd796dbfdf2..dd9047c293f 100755 --- a/tests/clickhouse-test +++ b/tests/clickhouse-test @@ -75,11 +75,13 @@ def stringhash(s): # only during process invocation https://stackoverflow.com/a/42089311 return zlib.crc32(s.encode("utf-8")) + def read_file_as_binary_string(file_path): - with open(file_path, 'rb') as file: + with open(file_path, "rb") as file: binary_data = file.read() return binary_data + # First and last lines of the log def trim_for_log(s): if not s: @@ -146,7 +148,7 @@ def clickhouse_execute_http( client.request( "POST", f"/?{base_args.client_options_query_str}{urllib.parse.urlencode(params)}", - body=body + body=body, ) res = client.getresponse() data = res.read() From 71bef27abfa9cd64a318306ddd11b21b907a37ac Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 06:26:54 +0100 Subject: [PATCH 0143/1081] Follow-up --- docker/test/base/setup_export_logs.sh | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/docker/test/base/setup_export_logs.sh b/docker/test/base/setup_export_logs.sh index 26fcd10d666..96a15c33674 100755 --- a/docker/test/base/setup_export_logs.sh +++ b/docker/test/base/setup_export_logs.sh @@ -194,7 +194,7 @@ function setup_logs_replication echo "Creating table system.${table}_sender" >&2 # Create Distributed table and materialized view to watch on the original table: - clickhouse-client --asterisk_include_materialized_columns 1 --query " + clickhouse-client --query " CREATE TABLE system.${table}_sender ENGINE = Distributed(${CLICKHOUSE_CI_LOGS_CLUSTER}, default, ${table}_${hash}) SETTINGS flush_on_detach=0 @@ -205,7 +205,7 @@ function setup_logs_replication echo "Creating materialized view system.${table}_watcher" >&2 - clickhouse-client --asterisk_include_materialized_columns 1 --query " + clickhouse-client --query " CREATE MATERIALIZED VIEW system.${table}_watcher TO system.${table}_sender AS SELECT ${EXTRA_COLUMNS_EXPRESSION_FOR_TABLE}, * FROM system.${table} From 3eba7678057df92e8a7f91912863843d377eecd4 Mon Sep 17 00:00:00 2001 From: yariks5s Date: Mon, 15 Jan 2024 19:17:13 +0000 Subject: [PATCH 0144/1081] init --- src/Interpreters/InterpreterCreateQuery.cpp | 10 ++++++++-- .../02973_dictionary_table_exception_fix.reference | 0 .../02973_dictionary_table_exception_fix.sql | 6 ++++++ 3 files changed, 14 insertions(+), 2 deletions(-) create mode 100644 tests/queries/0_stateless/02973_dictionary_table_exception_fix.reference create mode 100644 tests/queries/0_stateless/02973_dictionary_table_exception_fix.sql diff --git a/src/Interpreters/InterpreterCreateQuery.cpp b/src/Interpreters/InterpreterCreateQuery.cpp index 
36e864ace26..c00f58de59a 100644 --- a/src/Interpreters/InterpreterCreateQuery.cpp +++ b/src/Interpreters/InterpreterCreateQuery.cpp @@ -1405,8 +1405,14 @@ bool InterpreterCreateQuery::doCreateTable(ASTCreateQuery & create, interpreter.execute(); } else - throw Exception(storage_already_exists_error_code, - "{} {}.{} already exists", storage_name, backQuoteIfNeed(create.getDatabase()), backQuoteIfNeed(create.getTable())); + { + if (database->getTable(create.getTable(), getContext())->isDictionary()) + throw Exception(ErrorCodes::DICTIONARY_ALREADY_EXISTS, + "Dictionary {}.{} already exists", backQuoteIfNeed(create.getDatabase()), backQuoteIfNeed(create.getTable())); + else + throw Exception(ErrorCodes::TABLE_ALREADY_EXISTS, + "Table {}.{} already exists", backQuoteIfNeed(create.getDatabase()), backQuoteIfNeed(create.getTable())); + } } else if (!create.attach) { diff --git a/tests/queries/0_stateless/02973_dictionary_table_exception_fix.reference b/tests/queries/0_stateless/02973_dictionary_table_exception_fix.reference new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/queries/0_stateless/02973_dictionary_table_exception_fix.sql b/tests/queries/0_stateless/02973_dictionary_table_exception_fix.sql new file mode 100644 index 00000000000..f8061b42670 --- /dev/null +++ b/tests/queries/0_stateless/02973_dictionary_table_exception_fix.sql @@ -0,0 +1,6 @@ +CREATE TABLE test_table (i Int64) engine=MergeTree order by i; +CREATE DICTIONARY test_dict (y String, value UInt64 DEFAULT 0) PRIMARY KEY y SOURCE(CLICKHOUSE(TABLE 'test_table')) LAYOUT(DIRECT()); +CREATE TABLE test_dict (y Int64) engine=MergeTree order by y; -- { serverError DICTIONARY_ALREADY_EXISTS } +CREATE DICTIONARY test_table (y String, value UInt64 DEFAULT 0) PRIMARY KEY y SOURCE(CLICKHOUSE(TABLE 'test_table')) LAYOUT(DIRECT()); -- { serverError TABLE_ALREADY_EXISTS } +CREATE DICTIONARY test_dict (y String, value UInt64 DEFAULT 0) PRIMARY KEY y SOURCE(CLICKHOUSE(TABLE 'test_table')) LAYOUT(DIRECT()); -- { serverError DICTIONARY_ALREADY_EXISTS } +CREATE TABLE test_table (y Int64) engine=MergeTree order by y; -- { serverError TABLE_ALREADY_EXISTS } From c5024a5f6d7f88f0fd8dc2af2c52eb1c1d57d2c2 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Mon, 15 Jan 2024 23:36:48 +0100 Subject: [PATCH 0145/1081] Fix typo --- docker/test/base/setup_export_logs.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docker/test/base/setup_export_logs.sh b/docker/test/base/setup_export_logs.sh index 96a15c33674..416281c2aa3 100755 --- a/docker/test/base/setup_export_logs.sh +++ b/docker/test/base/setup_export_logs.sh @@ -30,7 +30,7 @@ EXTRA_COLUMNS_EXPRESSION_COVERAGE_LOG="${EXTRA_COLUMNS_EXPRESSION}, arrayMap(x - function __set_connection_args { - # It's impossible to use generous $CONNECTION_ARGS string, it's unsafe from word splitting perspective. + # It's impossible to use a generic $CONNECTION_ARGS string, it's unsafe from word splitting perspective. 
# That's why we must stick to the generated option CONNECTION_ARGS=( --receive_timeout=45 --send_timeout=45 --secure From 1caef191436fc05856be3b85b19cfcd97d0dc804 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Tue, 16 Jan 2024 09:44:52 +0100 Subject: [PATCH 0146/1081] Maybe better --- programs/main.cpp | 81 ++++++++++++++++++++++++++--------------------- 1 file changed, 45 insertions(+), 36 deletions(-) diff --git a/programs/main.cpp b/programs/main.cpp index 8958d84e243..1ff7e5db560 100644 --- a/programs/main.cpp +++ b/programs/main.cpp @@ -394,6 +394,50 @@ void checkHarmfulEnvironmentVariables(char ** argv) } #endif + +#if defined(SANITIZE_COVERAGE) +__attribute__((no_sanitize("coverage"))) +void dumpCoverage() +{ + /// A user can request to dump the coverage information into files at exit. + /// This is useful for non-server applications such as clickhouse-format or clickhouse-client, + /// that cannot introspect it with SQL functions at runtime. + + /// The CLICKHOUSE_WRITE_COVERAGE environment variable defines a prefix for a filename 'prefix.pid' + /// containing the list of addresses of covered . + + /// The format is even simpler than Clang's "sancov": an array of 64-bit addresses, native byte order, no header. + + if (const char * coverage_filename_prefix = getenv("CLICKHOUSE_WRITE_COVERAGE")) // NOLINT(concurrency-mt-unsafe) + { + auto dump = [](const std::string & name, auto span) + { + /// Write only non-zeros. + std::vector data; + data.reserve(span.size()); + for (auto addr : span) + if (addr) + data.push_back(addr); + + int fd = ::open(name.c_str(), O_WRONLY | O_CREAT | O_TRUNC | O_CLOEXEC, 0400); + if (-1 == fd) + { + writeError("Cannot open a file to write the coverage data\n"); + } + else + { + if (!writeRetry(fd, reinterpret_cast(data.data()), data.size() * sizeof(data[0]))) + writeError("Cannot write the coverage data to a file\n"); + if (0 != ::close(fd)) + writeError("Cannot close the file with coverage data\n"); + } + }; + + dump(fmt::format("{}.{}", coverage_filename_prefix, getpid()), getCumulativeCoverage()); + } +} +#endif + } bool isClickhouseApp(std::string_view app_suffix, std::vector & argv) @@ -517,42 +561,7 @@ int main(int argc_, char ** argv_) int exit_code = main_func(static_cast(argv.size()), argv.data()); #if defined(SANITIZE_COVERAGE) - /// A user can request to dump the coverage information into files at exit. - /// This is useful for non-server applications such as clickhouse-format or clickhouse-client, - /// that cannot introspect it with SQL functions at runtime. - - /// The CLICKHOUSE_WRITE_COVERAGE environment variable defines a prefix for a filename 'prefix.pid' - /// containing the list of addresses of covered . - - /// The format is even simpler than Clang's "sancov": an array of 64-bit addresses, native byte order, no header. - - if (const char * coverage_filename_prefix = getenv("CLICKHOUSE_WRITE_COVERAGE")) // NOLINT(concurrency-mt-unsafe) - { - auto dumpCoverage = [](const std::string & name, auto span) - { - /// Write only non-zeros. 
- std::vector data; - data.reserve(span.size()); - for (auto addr : span) - if (addr) - data.push_back(addr); - - int fd = ::open(name.c_str(), O_WRONLY | O_CREAT | O_TRUNC | O_CLOEXEC, 0400); - if (-1 == fd) - { - writeError("Cannot open a file to write the coverage data\n"); - } - else - { - if (!writeRetry(fd, reinterpret_cast(data.data()), data.size() * sizeof(data[0]))) - writeError("Cannot write the coverage data to a file\n"); - if (0 != ::close(fd)) - writeError("Cannot close the file with coverage data\n"); - } - }; - - dumpCoverage(fmt::format("{}.{}", coverage_filename_prefix, getpid()), getCumulativeCoverage()); - } + dumpCoverage(); #endif return exit_code; From 21082be9a681166b5585445c8aed62e705063081 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Tue, 16 Jan 2024 10:41:13 +0100 Subject: [PATCH 0147/1081] Better test --- tests/clickhouse-test | 18 +++++++++++------- 1 file changed, 11 insertions(+), 7 deletions(-) diff --git a/tests/clickhouse-test b/tests/clickhouse-test index dd9047c293f..6d398115d43 100755 --- a/tests/clickhouse-test +++ b/tests/clickhouse-test @@ -1269,13 +1269,17 @@ class TestCase: file_pattern = "coverage.*" matching_files = glob.glob(file_pattern) for file_path in matching_files: - body = read_file_as_binary_string(file_path) - clickhouse_execute( - args, - f"INSERT INTO system.coverage_log SELECT now(), '{self.case}', groupArray(data) FROM input('data UInt64') FORMAT RowBinary", - body=body, - retry_error_codes=True, - ) + try: + body = read_file_as_binary_string(file_path) + clickhouse_execute( + args, + f"INSERT INTO system.coverage_log SELECT now(), '{self.case}', groupArray(data) FROM input('data UInt64') FORMAT RowBinary", + body=body, + retry_error_codes=True, + ) + except Exception as e: + print("Cannot insert coverage data: ", str(e)) + # Remove the file even in case of exception to avoid accumulation and quadratic complexity. 
os.remove(file_path) coverage = clickhouse_execute( From 6b8d53a9fa54e53c766c431201ea8dfd742630ea Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Tue, 16 Jan 2024 11:07:30 +0100 Subject: [PATCH 0148/1081] Remove obsolete comment --- tests/clickhouse-test | 1 - 1 file changed, 1 deletion(-) diff --git a/tests/clickhouse-test b/tests/clickhouse-test index 6d398115d43..02693b997b4 100755 --- a/tests/clickhouse-test +++ b/tests/clickhouse-test @@ -412,7 +412,6 @@ def get_stacktraces_from_gdb(server_pid): # collect server stacktraces from system.stack_trace table -# it does not work in Sandbox def get_stacktraces_from_clickhouse(args): settings_str = " ".join( [ From 605c76e66ea5bdd2644026a5c7425e87f24c3702 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Tue, 16 Jan 2024 11:22:27 +0100 Subject: [PATCH 0149/1081] Fix test fails --- src/Analyzer/Passes/QueryAnalysisPass.cpp | 22 +++++++++++++--------- 1 file changed, 13 insertions(+), 9 deletions(-) diff --git a/src/Analyzer/Passes/QueryAnalysisPass.cpp b/src/Analyzer/Passes/QueryAnalysisPass.cpp index 0dc3026afc0..b235918c438 100644 --- a/src/Analyzer/Passes/QueryAnalysisPass.cpp +++ b/src/Analyzer/Passes/QueryAnalysisPass.cpp @@ -6400,23 +6400,27 @@ void QueryAnalyzer::resolveTableFunction(QueryTreeNodePtr & table_function_node, { String database_name = scope.context->getCurrentDatabase(); - String table_name = table_function_node->getOriginalAST()->as()->name; + String table_name = ""; - if (table_function_node->getOriginalAST()->as()->is_compound_name) + if (table_function_node->getOriginalAST() && table_function_node->getOriginalAST()->as()) { - std::vector parts; - splitInto<'.'>(parts, table_function_node->getOriginalAST()->as()->name); - - if (parts.size() == 2) + table_name = table_function_node->getOriginalAST()->as()->name; + if (table_function_node->getOriginalAST()->as()->is_compound_name) { - database_name = parts[0]; - table_name = parts[1]; + std::vector parts; + splitInto<'.'>(parts, table_function_node->getOriginalAST()->as()->name); + + if (parts.size() == 2) + { + database_name = parts[0]; + table_name = parts[1]; + } } } auto & table_function_node_typed = table_function_node->as(); - StoragePtr table = DatabaseCatalog::instance().tryGetTable({database_name, table_name}, scope.context->getQueryContext()); + StoragePtr table = table_name.empty() ? 
nullptr : DatabaseCatalog::instance().tryGetTable({database_name, table_name}, scope.context->getQueryContext()); if (table) { if (table.get()->isView() && table->as() && table->as()->isParameterizedView()) From 7bc6a858c7778911a51e4c2430125f9c3741a535 Mon Sep 17 00:00:00 2001 From: kssenii Date: Tue, 16 Jan 2024 19:44:55 +0100 Subject: [PATCH 0150/1081] Rewrite bash test to integration test --- .../test_broken_projections/__init__.py | 0 .../config.d/backups.xml | 13 + .../test_broken_projections/test.py | 492 +++++++++++++++++ .../02916_broken_projection.reference | 322 ----------- .../0_stateless/02916_broken_projection.sh | 515 ------------------ 5 files changed, 505 insertions(+), 837 deletions(-) create mode 100644 tests/integration/test_broken_projections/__init__.py create mode 100644 tests/integration/test_broken_projections/config.d/backups.xml create mode 100644 tests/integration/test_broken_projections/test.py delete mode 100644 tests/queries/0_stateless/02916_broken_projection.reference delete mode 100755 tests/queries/0_stateless/02916_broken_projection.sh diff --git a/tests/integration/test_broken_projections/__init__.py b/tests/integration/test_broken_projections/__init__.py new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/integration/test_broken_projections/config.d/backups.xml b/tests/integration/test_broken_projections/config.d/backups.xml new file mode 100644 index 00000000000..4da8edffd67 --- /dev/null +++ b/tests/integration/test_broken_projections/config.d/backups.xml @@ -0,0 +1,13 @@ + + + + + local + /var/lib/clickhouse/disks/backups/ + + + + + backups + + diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py new file mode 100644 index 00000000000..ca1a29817a5 --- /dev/null +++ b/tests/integration/test_broken_projections/test.py @@ -0,0 +1,492 @@ +import time +import pytest +import logging +import string +import random +from helpers.cluster import ClickHouseCluster + +cluster = ClickHouseCluster(__file__) + + +@pytest.fixture(scope="module") +def cluster(): + try: + cluster = ClickHouseCluster(__file__) + cluster.add_instance( + "node", + main_configs=["config.d/backups.xml"], + stay_alive=True, + with_zookeeper=True, + ) + + logging.info("Starting cluster...") + cluster.start() + logging.info("Cluster started") + + yield cluster + finally: + cluster.shutdown() + + +def create_table(node, table, replica, data_prefix = ""): + if data_prefix == "": + data_prefix = table + + node.query( + f""" + DROP TABLE IF EXISTS {table} SYNC; + CREATE TABLE {table} + ( + a String, + b String, + c Int64, + d Int64, + e Int64, + + PROJECTION proj + ( + SELECT c ORDER BY d + ), + PROJECTION proj_2 + ( + SELECT d ORDER BY c + ) + ) + ENGINE = ReplicatedMergeTree('/test_broken_projection_{data_prefix}/data/', '{replica}') ORDER BY a + SETTINGS min_bytes_for_wide_part = 0, + max_parts_to_merge_at_once=3, + enable_vertical_merge_algorithm=1, + vertical_merge_algorithm_min_rows_to_activate = 1, + vertical_merge_algorithm_min_columns_to_activate = 1, + vertical_merge_algorithm_min_columns_to_activate = 1, + compress_primary_key=0; + """ + ) + + +def insert(node, table, offset, size): + node.query( + f""" + INSERT INTO {table} + SELECT number, number, number, number, number%2 FROM numbers({offset}, {size}) + SETTINGS insert_keeper_fault_injection_probability=0.0; + """ + ) + + +def get_parts(node, table): + return ( + node.query( + f""" + SELECT name + FROM system.parts + WHERE table='{table}' AND 
database=currentDatabase() AND active = 1 + ORDER BY name;" + """ + ) + .strip() + .split("\n") + ) + + +def bash(node, command): + node.exec_in_container(["bash", "-c", command], privileged=True, user="root") + + +def break_projection(node, table, part, parent_part, break_type): + part_path = node.query( + f""" + SELECT path + FROM system.projection_parts + WHERE table='{table}' + AND database=currentDatabase() + AND active=1 + AND part_name='{part}' + AND parent_name='{parent_part}' + ORDER BY modification_time DESC + LIMIT 1; + """ + ).strip() + + node.query( + f"select throwIf(substring('{part_path}', 1, 1) != '/', 'Path is relative: {part_path}')" + ) + + if break_type == "data": + bash(node, f"rm '{part_path}/d.bin'") + bash(node, f"rm '{part_path}/c.bin'") + elif break_type == "metadata": + bash(node, f"rm '{part_path}/columns.txt'") + elif break_type == "part": + bash(node, f"rm -r '{part_path}'") + + +def break_part(node, table, part): + part_path = node.query( + f""" + SELECT path + FROM system.parts + WHERE table='{table}' + AND database=currentDatabase() + AND active=1 + AND part_name='{part}' + ORDER BY modification_time DESC + LIMIT 1; + """ + ).strip() + + node.query( + f"select throwIf(substring('{part_path}', 1, 1) != '/', 'Path is relative: {part_path}')" + ) + bash(node, f"rm '{part_path}/columns.txt'") + + +def get_broken_projections_info(node, table): + return node.query( + f""" + SELECT parent_name, name, errors.name FROM + ( + SELECT parent_name, name, exception_code + FROM system.projection_parts + WHERE table='{table}' + AND database=currentDatabase() + AND is_broken = 1 + ) AS parts_info + INNER JOIN system.errors AS errors + ON parts_info.exception_code = errors.code + ORDER BY parent_name, name + """ + ).strip() + + +def optimize(node, table, final, no_wait): + query = f"OPTIMIZE TABLE {table}" + if final: + query += " FINAL" + if no_wait: + query += " SETTINGS alter_sync=0" + node.query(query) + + +def reattach(node, table): + node.query( + f""" + DETACH TABLE {table}; + ATTACH TABLE {table}; + """ + ) + + +def materialize_projection(node, table, proj): + node.query( + f"ALTER TABLE {table} MATERIALIZE PROJECTION {proj} SETTINGS mutations_sync=2" + ) + + +def check_table_full(node, table): + return node.query( + f"CHECK TABLE {table} SETTINGS check_query_single_value_result = 0;" + ).strip() + + +def random_str(length=6): + alphabet = string.ascii_lowercase + string.digits + return "".join(random.SystemRandom().choice(alphabet) for _ in range(length)) + + +def check(node, table, check_result, expect_broken_part="", expected_error=""): + query_id = random_str() + + if expect_broken_part == "proj": + assert expected_error in node.query_and_get_error( + f"SELECT c FROM '{table}' WHERE d == 12 ORDER BY c" + ) + else: + node.query( + f"SELECT c FROM '{table}' WHERE d == 12 OR d == 16 ORDER BY c", + query_id=query_id, + ) + assert "proj" in node.query( + f""" + SYSTEM FLUSH LOGS; + SELECT query, splitByChar('.', arrayJoin(projections))[-1] + FROM system.query_log + WHERE current_database=currentDatabase() AND query_id='{query_id}' AND type='QueryFinish' + """ + ) + + query_id = random_str() + + if expect_broken_part == "proj_2": + assert expected_error in node.query_and_get_error( + f"SELECT d FROM '{table}' WHERE c == 12 ORDER BY d" + ) + else: + node.query( + f"SELECT d FROM '{table}' WHERE c == 12 OR c == 16 ORDER BY d", + query_id=query_id, + ) + assert "proj" in node.query( + f""" + SYSTEM FLUSH LOGS; + SELECT query, splitByChar('.', arrayJoin(projections))[-1] 
+ FROM system.query_log + WHERE current_database=currentDatabase() AND query_id='{query_id}' AND type='QueryFinish' + """ + ) + + assert check_result == int(node.query(f"CHECK TABLE {table}")) + + +def test_broken_ignored(cluster): + node = cluster.instances["node"] + + table_name = "test1" + create_table(node, table_name, 1) + + insert(node, table_name, 0, 5) + insert(node, table_name, 5, 5) + insert(node, table_name, 10, 5) + insert(node, table_name, 15, 5) + + assert ["all_0_0_0", "all_1_1_0", "all_2_2_0", "all_3_3_0"] == get_parts( + node, table_name + ) + + # Break metadata (columns.txt) file of projection 'proj' + break_projection(node, table_name, "proj", "all_2_2_0", "metadata") + + # Do select and after "check table" query. + # Select works because it does not read columns.txt. + # But expect check table result as 0. + check(node, table_name, 0) + + # Projection 'proj' from part all_2_2_0 will now appear in broken parts info + # because it was marked broken during "check table" query. + assert "all_2_2_0\tproj\tFILE_DOESNT_EXIST" in get_broken_projections_info( + node, table_name + ) + + # Check table query will also show a list of parts which have broken projections. + assert "all_2_2_0" in check_table_full(node, table_name) + + # Break data file of projection 'proj_2' for part all_2_2_0 + break_projection(node, table_name, "proj_2", "all_2_2_0", "data") + + # It will not yet appear in broken projections info. + assert "proj_2" not in get_broken_projections_info(node, table_name) + + # Select now fails with error "File doesn't exist" + check(node, table_name, 0, "proj_2", "FILE_DOESNT_EXIST") + + # Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info. + assert "all_2_2_0\tproj_2\tNO_FILE_IN_DATA_PART" in get_broken_projections_info( + node, table_name + ) + + # Second select works, because projection is now marked as broken. + check(node, table_name, 0) + + # Break data file of projection 'proj_2' for part all_3_3_0 + break_projection(node, table_name, "proj_2", "all_3_3_0", "data") + + # It will not yet appear in broken projections info. + assert "all_3_3_0" not in get_broken_projections_info(node, table_name) + + insert(node, table_name, 20, 5) + insert(node, table_name, 25, 5) + + # Part all_3_3_0 has 'proj' and 'proj_2' projections, but 'proj_2' is broken and server does NOT know it yet. + # Parts all_4_4_0 and all_5_5_0 have both non-broken projections. + # So a merge will be create for future part all_3_5_1. + # During merge it will fail to read from 'proj_2' of part all_3_3_0 and proj_2 will be marked broken. + # Merge will be retried and on second attempt it will succeed. + # The result part all_3_5_1 will have only 1 projection - 'proj', because + # it will skip 'proj_2' as it will see that one part does not have it anymore in the set of valid projections. 
+ optimize(node, table_name, 0, 1) + time.sleep(5) + + # table_uuid=node.query(f"SELECT uuid FROM system.tables WHERE table='{table_name}' and database=currentDatabase()").strip() + # assert 0 < int( + # node.query( + # f""" + # SYSTEM FLUSH LOGS; + # SELECT count() FROM system.text_log + # WHERE level='Error' + # AND logger_name='MergeTreeBackgroundExecutor' + # AND message like 'Exception while executing background task %{table_uuid}:all_3_5_1%%Cannot open file%proj_2.proj/c.bin%' + # """) + # ) + + assert "all_3_3_0" in get_broken_projections_info(node, table_name) + check(node, table_name, 0) + + +def test_materialize_broken_projection(cluster): + node = cluster.instances["node"] + + table_name = "test2" + create_table(node, table_name, 1) + + insert(node, table_name, 0, 5) + insert(node, table_name, 5, 5) + insert(node, table_name, 10, 5) + insert(node, table_name, 15, 5) + + assert ["all_0_0_0", "all_1_1_0", "all_2_2_0", "all_3_3_0"] == get_parts( + node, table_name + ) + + break_projection(node, table_name, "proj", "all_1_1_0", "metadata") + reattach(node, table_name) + + assert "all_1_1_0\tproj\tNO_FILE_IN_DATA_PART" in get_broken_projections_info( + node, table_name + ) + assert "Part all_1_1_0 has a broken projection proj" in check_table_full( + node, table_name + ) + + break_projection(node, table_name, "proj_2", "all_1_1_0", "data") + reattach(node, table_name) + + assert "all_1_1_0\tproj_2\tFILE_DOESNT_EXIST" in get_broken_projections_info( + node, table_name + ) + assert "Part all_1_1_0 has a broken projection proj_2" in check_table_full( + node, table_name + ) + + materialize_projection(node, table_name, "proj") + + assert "has a broken projection" not in check_table_full(node, table_name) + + +def test_broken_ignored_replicated(cluster): + node = cluster.instances["node"] + + table_name = "test3" + table_name2 = "test3_replica" + create_table(node, table_name, 1) + + insert(node, table_name, 0, 5) + insert(node, table_name, 5, 5) + insert(node, table_name, 10, 5) + insert(node, table_name, 15, 5) + + check(node, table_name, 1) + + create_table(node, table_name2, 2, table_name) + check(node, table_name2, 1) + + break_projection(node, table_name, "proj", "all_0_0_0", "data") + assert "Part all_0_0_0 has a broken projection proj" in check_table_full( + node, table_name + ) + + break_part(node, table_name, "all_0_0_0") + node.query(f"SYSTEM SYNC REPLICA {table_name}") + assert "has a broken projection" not in check_table_full(node, table_name) + + +def test_broken_projections_in_backups(cluster): + node = cluster.instances["node"] + + table_name = "test4" + create_table(node, table_name, 1) + + insert(node, table_name, 0, 5) + insert(node, table_name, 5, 5) + insert(node, table_name, 10, 5) + insert(node, table_name, 15, 5) + + check(node, table_name, 1) + + break_projection(node, table_name, "proj", "all_2_2_0", "data") + check(node, table_name, 0, "proj", "FILE_DOESNT_EXIST") + + assert "all_2_2_0\tproj\tNO_FILE_IN_DATA_PART" in get_broken_projections_info( + node, table_name + ) + + assert "BACKUP_CREATED" in node.query( + f""" + set backup_restore_keeper_fault_injection_probability=0.0; + backup table {table_name} to Disk('backups', 'b1') settings check_projection_parts=false; + """ + ) + + assert "RESTORED" in node.query( + f""" + drop table {table_name} sync; + set backup_restore_keeper_fault_injection_probability=0.0; + restore table {table_name} from Disk('backups', 'b1'); + """ + ) + + check(node, table_name, 1) + + assert "" == get_broken_projections_info(node, 
table_name) + # TODO: add a check for what projections are loaded + + break_projection(node, table_name, "proj", "all_2_2_0", "part") + + check(node, table_name, 0, "proj", "ErrnoException") + + assert "all_2_2_0\tproj\tFILE_DOESNT_EXIST" == get_broken_projections_info( + node, table_name + ) + + assert "FILE_DOESNT_EXIST" in node.query_and_get_error( + f""" + set backup_restore_keeper_fault_injection_probability=0.0; + backup table {table_name} to Disk('backups', 'b2') + """ + ) + + materialize_projection(node, table_name, "proj") + check(node, table_name, 1) + # TODO: + # assert "all_2_2_0\tproj\tFILE_DOESNT_EXIST" == get_broken_projections_info(node, table_name) + + assert "BACKUP_CREATED" in node.query( + f""" + set backup_restore_keeper_fault_injection_probability=0.0; + backup table {table_name} to Disk('backups', 'b3') settings check_projection_parts=false; + """ + ) + + assert "RESTORED" in node.query( + f""" + drop table {table_name} sync; + set backup_restore_keeper_fault_injection_probability=0.0; + restore table {table_name} from Disk('backups', 'b3'); + """ + ) + check(node, table_name, 1) + + break_projection(node, table_name, "proj", "all_1_1_0", "part") + # TODO: check(node, table_name, 0, "proj", "FILE_DOESNT_EXIST") + assert "Part all_1_1_0 has a broken projection proj" in check_table_full( + node, table_name + ) + assert "all_1_1_0\tproj\tFILE_DOESNT_EXIST" == get_broken_projections_info( + node, table_name + ) + + assert "BACKUP_CREATED" in node.query( + f""" + set backup_restore_keeper_fault_injection_probability=0.0; + backup table {table_name} to Disk('backups', 'b4') settings check_projection_parts=false; + """ + ) + + assert "RESTORED" in node.query( + f""" + drop table {table_name} sync; + set backup_restore_keeper_fault_injection_probability=0.0; + restore table {table_name} from Disk('backups', 'b4'); + """ + ) + check(node, table_name, 1) + assert "" == get_broken_projections_info(node, table_name) diff --git a/tests/queries/0_stateless/02916_broken_projection.reference b/tests/queries/0_stateless/02916_broken_projection.reference deleted file mode 100644 index 3967215e5de..00000000000 --- a/tests/queries/0_stateless/02916_broken_projection.reference +++ /dev/null @@ -1,322 +0,0 @@ -insert new part -insert new part -insert new part -insert new part -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -0 -broke metadata of part 'proj' (parent part: all_2_2_0) -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -broken projections info -all_2_2_0 proj FILE_DOESNT_EXIST -check table full (test - all_2_2_0) -all_2_2_0 -0 -broke data of part 'proj_2' (parent part: all_2_2_0) -broken projections info -all_2_2_0 proj FILE_DOESNT_EXIST -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2', expect error: proj_2 -FILE_DOESNT_EXIST -check table -0 -broken projections info -all_2_2_0 proj FILE_DOESNT_EXIST -all_2_2_0 proj_2 NO_FILE_IN_DATA_PART -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from 
projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -0 -broke data of part 'proj_2' (parent part: all_3_3_0) -broken projections info -all_2_2_0 proj FILE_DOESNT_EXIST -all_2_2_0 proj_2 NO_FILE_IN_DATA_PART -insert new part -insert new part -optimize -OPTIMIZE TABLE test SETTINGS alter_sync=0 -0 -broken projections info -all_2_2_0 proj FILE_DOESNT_EXIST -all_2_2_0 proj_2 NO_FILE_IN_DATA_PART -all_3_3_0 proj_2 NO_FILE_IN_DATA_PART -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -0 -broke metadata of part 'proj' (parent part: all_1_1_0) -Detach - Attach -broken projections info -all_1_1_0 proj NO_FILE_IN_DATA_PART -all_2_2_0 proj NO_FILE_IN_DATA_PART -all_2_2_0 proj_2 FILE_DOESNT_EXIST -all_3_3_0 proj_2 FILE_DOESNT_EXIST -0 -broke data of part 'proj_2' (parent part: all_1_1_0) -Detach - Attach -broken projections info -all_1_1_0 proj NO_FILE_IN_DATA_PART -all_1_1_0 proj_2 FILE_DOESNT_EXIST -all_2_2_0 proj NO_FILE_IN_DATA_PART -all_2_2_0 proj_2 FILE_DOESNT_EXIST -all_3_3_0 proj_2 FILE_DOESNT_EXIST -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -check table full (test - all_1_1_0) -all_1_1_0 -materialize projection proj -check table full (test - ) -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -materialize projection proj_2 -check table full (test - ) -0 -broke data of part 'proj' (parent part: all_3_5_1_7) -insert new part -optimize -OPTIMIZE TABLE test FINAL -insert new part -optimize -OPTIMIZE TABLE test FINAL -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj_2 -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -insert new part -insert new part -insert new part -insert new part -select from projection 'proj' -used projections -SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -used projections -SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -select from projection 'proj' -used projections -SELECT c FROM test2_replica WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -used projections -SELECT d FROM test2_replica WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -0 -broke data of part 'proj' (parent part: all_0_0_0) -check table full (test2 - all_0_0_0) -all_0_0_0 -select from projection 'proj' -used projections -SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -used projections -SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -broke data of part 'all_0_0_0' -check table full (test2 - all_0_0_0) -all_0_0_0 -select from projection 'proj' -used projections -SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -used 
projections -SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -select from projection 'proj' -used projections -SELECT c FROM test2 WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -used projections -SELECT d FROM test2 WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -insert new part -insert new part -insert new part -insert new part -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -0 -broke data of part 'proj' (parent part: all_2_2_0) -select from projection 'proj', expect error: proj -FILE_DOESNT_EXIST -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -broken projections info -all_2_2_0 proj NO_FILE_IN_DATA_PART -BACKUP_CREATED -RESTORED -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -broken projections info -0 -broke all data of part 'proj' (parent part: all_2_2_0) -select from projection 'proj', expect error: proj -Errno -Errno -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -broken projections info -all_2_2_0 proj FILE_DOESNT_EXIST -FILE_DOESNT_EXIST -materialize projection proj -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -broken projections info -all_2_2_0 proj FILE_DOESNT_EXIST -BACKUP_CREATED -RESTORED -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -1 -0 -broke all data of part 'proj' (parent part: all_1_1_0) -select from projection 'proj', expect error: proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -broken projections info -all_1_1_0 proj FILE_DOESNT_EXIST -BACKUP_CREATED -RESTORED -select from projection 'proj' -12 -16 -used projections -SELECT c FROM test WHERE d == 12 OR d == 16 ORDER BY c; proj -select from projection 'proj_2' -12 -16 -used projections -SELECT d FROM test WHERE c == 12 OR c == 16 ORDER BY d; proj_2 -check table -0 -broken projections info -all_1_1_0 proj NO_FILE_IN_DATA_PART diff --git a/tests/queries/0_stateless/02916_broken_projection.sh b/tests/queries/0_stateless/02916_broken_projection.sh deleted file mode 100755 index fbd26e59f6f..00000000000 --- a/tests/queries/0_stateless/02916_broken_projection.sh +++ /dev/null @@ -1,515 +0,0 @@ -#!/usr/bin/env bash -# Tags: long, no-random-merge-tree-settings, no-random-settings, no-s3-storage, no-parallel -# shellcheck disable=SC2046 - -CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) -# shellcheck source=../shell_config.sh -. 
"$CURDIR"/../shell_config.sh - -function create_table() -{ - test_id=$1 - name=$2 - replica=$3 - $CLICKHOUSE_CLIENT -nm -q " - DROP TABLE IF EXISTS $name SYNC; - CREATE TABLE $name - ( - a String, - b String, - c Int64, - d Int64, - e Int64, - - PROJECTION proj - ( - SELECT c ORDER BY d - ), - PROJECTION proj_2 - ( - SELECT d ORDER BY c - ) - ) - ENGINE = ReplicatedMergeTree('/test_broken_projection_32_$test_id/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/', '$replica') ORDER BY a - SETTINGS min_bytes_for_wide_part = 0, - max_parts_to_merge_at_once=3, - enable_vertical_merge_algorithm=1, - vertical_merge_algorithm_min_rows_to_activate = 1, - vertical_merge_algorithm_min_columns_to_activate = 1, - vertical_merge_algorithm_min_columns_to_activate = 1, - compress_primary_key=0; - " -} - -function random() -{ - cat /dev/urandom | LC_ALL=C tr -dc 'a-zA-Z' | fold -w ${1:-8} | head -n 1 -} - -function insert() -{ - table=$1 - offset=$2 - size=$3 - echo 'insert new part' - $CLICKHOUSE_CLIENT -q "INSERT INTO $table SELECT number, number, number, number, number%2 FROM numbers($offset, $size) SETTINGS insert_keeper_fault_injection_probability=0.0;" -} - -function break_projection() -{ - table=$1 - part_name=$2 - parent_name=$3 - break_type=$4 - - read -r part_path <<< $($CLICKHOUSE_CLIENT -nm -q " - SELECT path - FROM system.projection_parts - WHERE table='$table' - AND database=currentDatabase() - AND active=1 - AND part_name='$part_name' - AND parent_name='$parent_name' - ORDER BY modification_time DESC - LIMIT 1; - ") - - $CLICKHOUSE_CLIENT -q "select throwIf(substring('$part_path', 1, 1) != '/', 'Path is relative: $part_path')" || exit - - if [ "$break_type" = "data" ] - then - rm "$part_path/d.bin" - rm "$part_path/c.bin" - echo "broke data of part '$part_name' (parent part: $parent_name)" - fi - if [ "$break_type" = "metadata" ] - then - rm "$part_path/columns.txt" - echo "broke metadata of part '$part_name' (parent part: $parent_name)" - fi - if [ "$break_type" = "part" ] - then - rm -r "$part_path" - echo "broke all data of part '$part_name' (parent part: $parent_name)" - fi -} - -function break_part() -{ - table=$1 - part_name=$2 - - read -r part_path <<< $($CLICKHOUSE_CLIENT -nm -q " - SELECT path - FROM system.parts - WHERE table='$table' - AND database=currentDatabase() - AND active=1 - AND part_name='$part_name' - ORDER BY modification_time DESC - LIMIT 1; - ") - - if [ "$part_path" = "" ] - then - echo "Part path is empty" - exit - fi - - rm $part_path/columns.txt - echo "broke data of part '$part_name'" -} - -function broken_projections_info() -{ - table=$1 - echo 'broken projections info' - $CLICKHOUSE_CLIENT -q " - SELECT parent_name, name, errors.name FROM - ( - SELECT parent_name, name, exception_code - FROM system.projection_parts - WHERE table='$table' - AND database=currentDatabase() - AND is_broken = 1 - ) AS parts_info - INNER JOIN system.errors AS errors - ON parts_info.exception_code = errors.code - ORDER BY parent_name, name -" -} - -function check() -{ - table=$1 - expect_broken_part="" - expected_error="" - if [ $# -gt 1 ]; then - expect_broken_part=$2 - expected_error=$3 - fi - - #echo 'system.parts' - #$CLICKHOUSE_CLIENT -q " - #SELECT name, active, projections - #FROM system.parts - #WHERE table='$table' AND database=currentDatabase() - #ORDER BY name;" - - query_id=$(random 8) - - if [ "$expect_broken_part" = "proj" ] - then - echo "select from projection 'proj', expect error: $expect_broken_part" - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -nm -q " - 
SET send_logs_level='fatal'; - SELECT c FROM $table WHERE d == 12 ORDER BY c; - " 2>&1 | grep -oF "$expected_error" - else - echo "select from projection 'proj'" - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT c FROM $table WHERE d == 12 OR d == 16 ORDER BY c;" - echo 'used projections' - $CLICKHOUSE_CLIENT -nm -q " - SYSTEM FLUSH LOGS; - SELECT query, splitByChar('.', arrayJoin(projections))[-1] FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' - " - fi - - query_id=$(random 8) - - if [ "$expect_broken_part" = "proj_2" ] - then - echo "select from projection 'proj_2', expect error: $expect_broken_part" - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -nm -q " - SET send_logs_level='fatal'; - SELECT d FROM $table WHERE c == 12 ORDER BY d; - " 2>&1 | grep -oF "$expected_error" - else - echo "select from projection 'proj_2'" - $CLICKHOUSE_CLIENT --optimize_use_projections 1 --query_id $query_id -q "SELECT d FROM $table WHERE c == 12 OR c == 16 ORDER BY d;" - echo 'used projections' - $CLICKHOUSE_CLIENT -nm -q " - SYSTEM FLUSH LOGS; - SELECT query, splitByChar('.', arrayJoin(projections))[-1] FROM system.query_log WHERE current_database=currentDatabase() AND query_id='$query_id' AND type='QueryFinish' - " - fi - - echo 'check table' - $CLICKHOUSE_CLIENT -nm -q " - SET send_logs_level='fatal'; - CHECK TABLE $table;" -} - -function optimize() -{ - final=$1 - no_wait=$2 - - echo 'optimize' - query="OPTIMIZE TABLE test" - - if [ $final -eq 1 ]; then - query="$query FINAL" - fi - if [ $no_wait -eq 1 ]; then - query="$query SETTINGS alter_sync=0" - fi - - echo $query - - $CLICKHOUSE_CLIENT -q "$query" -} - -function reattach() -{ - echo 'Detach - Attach' - $CLICKHOUSE_CLIENT -nm -q " - SET send_logs_level='fatal'; - DETACH TABLE test; - ATTACH TABLE test; - " -} - -function materialize_projection -{ - table=$1 - projection=$2 - echo "materialize projection $projection" - $CLICKHOUSE_CLIENT -q "ALTER TABLE $table MATERIALIZE PROJECTION $projection SETTINGS mutations_sync=2" -} - -function check_table_full() -{ - table=$1 - expect_broken_part=$2 - echo "check table full ($1 - $2)" - if [ "$expect_broken_part" = "" ] - then - $CLICKHOUSE_CLIENT -nm -q " - SET send_logs_level='fatal'; - CHECK TABLE $table SETTINGS check_query_single_value_result = 0; - " | grep "broken" - else - $CLICKHOUSE_CLIENT -nm -q " - SET send_logs_level='fatal'; - CHECK TABLE $table SETTINGS check_query_single_value_result = 0; - " | grep "broken" | grep -o $expect_broken_part | head -n 1 - fi -} - -function test1() -{ - create_table test1 test 1 - - table_uuid=$($CLICKHOUSE_CLIENT -q "SELECT uuid FROM system.tables WHERE table='test' and database=currentDatabase()") - - insert test 0 5 - - insert test 5 5 - - insert test 10 5 - - insert test 15 5 - - check test - - # Break metadata file of projection 'proj' - break_projection test proj all_2_2_0 metadata - - # Do select and after "check table" query. - # Select works because it does not read columns.txt. - check test - - # Projection 'proj' from part all_2_2_0 will now appear in broken parts info - # because it was marked broken during "check table" query. - # TODO: try to mark it during select as well - broken_projections_info test - - # Check table query will also show a list of parts which have broken projections. 
- check_table_full test "all_2_2_0" - - # Break data file of projection 'proj_2' for part all_2_2_0 - break_projection test proj_2 all_2_2_0 data - - # It will not yet appear in broken projections info. - broken_projections_info test - - # Select now fails with error "File doesn't exist" - check test "proj_2" FILE_DOESNT_EXIST - - # Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info. - broken_projections_info test - - # Second select works, because projection is now marked as broken. - check test - - # Break data file of projection 'proj_2' for part all_3_3_0 - break_projection test proj_2 all_3_3_0 data - - # It will not yet appear in broken projections info. - broken_projections_info test - - insert test 20 5 - - insert test 25 5 - - # Part all_3_3_0 has 'proj' and 'proj_2' projections, but 'proj_2' is broken and server does NOT know it yet. - # Parts all_4_4_0 and all_5_5_0 have both non-broken projections. - # So a merge will be create for future part all_3_5_1. - # During merge it will fail to read from 'proj_2' of part all_3_3_0 and proj_2 will be marked broken. - # Merge will be retried and on second attempt it will succeed. - # The result part all_3_5_1 will have only 1 projection - 'proj', because - # it will skip 'proj_2' as it will see that one part does not have it anymore in the set of valid projections. - optimize 0 1 - sleep 2 - - $CLICKHOUSE_CLIENT -nm -q " - SYSTEM FLUSH LOGS; - SELECT count() FROM system.text_log - WHERE level='Error' - AND logger_name='MergeTreeBackgroundExecutor' - AND message like 'Exception while executing background task {$table_uuid:all_3_5_1}%Cannot open file%proj_2.proj/c.bin%' - " - - # Projection 'proj_2' from part all_2_2_0 will now appear in broken parts info. - broken_projections_info test - - check test - - break_projection test proj all_1_1_0 metadata - - reattach - - broken_projections_info test - - break_projection test proj_2 all_1_1_0 data - - reattach - - broken_projections_info test - - check test - - check_table_full test all_1_1_0 - - materialize_projection test proj - - check_table_full test - - check test - - materialize_projection test proj_2 - - check_table_full test - - break_projection test proj all_3_5_1_7 data - - insert test 30 5 - - optimize 1 0 - - insert test 35 5 - - optimize 1 0 - - check test -} - -function test2() -{ - create_table test2 test2 1 - - insert test2 0 5 - - insert test2 5 5 - - insert test 10 5 - - insert test 15 5 - - check test2 - - create_table test2 test2_replica 2 - - check test2_replica - - break_projection test2 proj all_0_0_0 data - - check_table_full test2 all_0_0_0 - - check test2 - - break_part test2 all_0_0_0 - - check_table_full test2 all_0_0_0 - - check test2 - - $CLICKHOUSE_CLIENT -q "SYSTEM SYNC REPLICA test2;" - - check test2 -} - -function test3() -{ - create_table test3 test 1 - - insert test 0 5 - - insert test 5 5 - - insert test 10 5 - - insert test 15 5 - - check test - - break_projection test proj all_2_2_0 data - - check test proj FILE_DOESNT_EXIST - - broken_projections_info test - - ${CLICKHOUSE_CLIENT} -nm --query " - set backup_restore_keeper_fault_injection_probability=0.0; - backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}') settings check_projection_parts=false; - " | grep -o "BACKUP_CREATED" - - ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " - drop table test sync; - set backup_restore_keeper_fault_injection_probability=0.0; - restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', 
'${CLICKHOUSE_TEST_UNIQUE_NAME}'); - " | grep -o "RESTORED" - - check test - - broken_projections_info test - - break_projection test proj all_2_2_0 part - - check test proj Errno - - broken_projections_info test - - ${CLICKHOUSE_CLIENT} -nm --query " - set send_logs_level='fatal'; - set backup_restore_keeper_fault_injection_probability=0.0; - backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_2') - " 2>&1 | grep -o "FILE_DOESNT_EXIST" - - materialize_projection test proj - - check test - - broken_projections_info test - - ${CLICKHOUSE_CLIENT} -nm --query " - set send_logs_level='fatal'; - set backup_restore_keeper_fault_injection_probability=0.0; - backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3') - " | grep -o "BACKUP_CREATED" - - ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " - drop table test sync; - set send_logs_level='fatal'; - set backup_restore_keeper_fault_injection_probability=0.0; - restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_3'); - " | grep -o "RESTORED" - - check test - - break_projection test proj all_1_1_0 part - - check test proj FILE_DOESNT_EXIST - - broken_projections_info test - - ${CLICKHOUSE_CLIENT} -nm --query " - set send_logs_level='fatal'; - set backup_restore_keeper_fault_injection_probability=0.0; - backup table ${CLICKHOUSE_DATABASE}.test to Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_4') - settings check_projection_parts=false, allow_backup_broken_projections=true; - " | grep -o "BACKUP_CREATED" - - ${CLICKHOUSE_CLIENT} -nm --stacktrace --query " - drop table test sync; - set send_logs_level='fatal'; - set backup_restore_keeper_fault_injection_probability=0.0; - restore table ${CLICKHOUSE_DATABASE}.test from Disk('backups', '${CLICKHOUSE_TEST_UNIQUE_NAME}_4'); - " | grep -o "RESTORED" - - check test - - broken_projections_info test -} - -test1 -test2 -test3 - - -$CLICKHOUSE_CLIENT -nm -q " -DROP TABLE IF EXISTS test SYNC; -DROP TABLE IF EXISTS test2 SYNC; -DROP TABLE IF EXISTS test2_replica SYNC; -" From 216769f43ea536a38b9e7d5650cdd02fae972caf Mon Sep 17 00:00:00 2001 From: robot-clickhouse Date: Tue, 16 Jan 2024 18:55:23 +0000 Subject: [PATCH 0151/1081] Automatic style fix --- tests/integration/test_broken_projections/test.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py index ca1a29817a5..cc3e55402b3 100644 --- a/tests/integration/test_broken_projections/test.py +++ b/tests/integration/test_broken_projections/test.py @@ -28,7 +28,7 @@ def cluster(): cluster.shutdown() -def create_table(node, table, replica, data_prefix = ""): +def create_table(node, table, replica, data_prefix=""): if data_prefix == "": data_prefix = table From 8d88f4cf87d13c6760a5235abf4180102daf8b5c Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Wed, 17 Jan 2024 09:42:53 +0100 Subject: [PATCH 0152/1081] Update setting is_parameterized_view & settings columns for view --- src/Interpreters/InterpreterCreateQuery.cpp | 5 ++++- src/Storages/StorageView.cpp | 2 +- 2 files changed, 5 insertions(+), 2 deletions(-) diff --git a/src/Interpreters/InterpreterCreateQuery.cpp b/src/Interpreters/InterpreterCreateQuery.cpp index 7985785aa9f..6031c8b4e46 100644 --- a/src/Interpreters/InterpreterCreateQuery.cpp +++ b/src/Interpreters/InterpreterCreateQuery.cpp @@ -780,8 +780,11 @@ InterpreterCreateQuery::TableProperties 
InterpreterCreateQuery::getTableProperti properties.constraints = as_storage_metadata->getConstraints(); } - else if (create.select && !create.isParameterizedView()) + else if (create.select) { + if (create.isParameterizedView()) + return properties; + Block as_select_sample; if (getContext()->getSettingsRef().allow_experimental_analyzer) diff --git a/src/Storages/StorageView.cpp b/src/Storages/StorageView.cpp index 1898e49de86..6b80e2450c4 100644 --- a/src/Storages/StorageView.cpp +++ b/src/Storages/StorageView.cpp @@ -112,7 +112,7 @@ StorageView::StorageView( : IStorage(table_id_) { StorageInMemoryMetadata storage_metadata; - if (is_parameterized_view_) + if (!is_parameterized_view_) { if (!query.isParameterizedView()) storage_metadata.setColumns(columns_); From dea8b10ae972b4fc2b20dbf90d90e362bf7e4207 Mon Sep 17 00:00:00 2001 From: kssenii Date: Wed, 17 Jan 2024 15:39:57 +0100 Subject: [PATCH 0153/1081] Fix test --- tests/integration/test_broken_projections/test.py | 11 +++-------- 1 file changed, 3 insertions(+), 8 deletions(-) diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py index ca1a29817a5..90d82f9f010 100644 --- a/tests/integration/test_broken_projections/test.py +++ b/tests/integration/test_broken_projections/test.py @@ -425,9 +425,7 @@ def test_broken_projections_in_backups(cluster): ) check(node, table_name, 1) - assert "" == get_broken_projections_info(node, table_name) - # TODO: add a check for what projections are loaded break_projection(node, table_name, "proj", "all_2_2_0", "part") @@ -446,8 +444,6 @@ def test_broken_projections_in_backups(cluster): materialize_projection(node, table_name, "proj") check(node, table_name, 1) - # TODO: - # assert "all_2_2_0\tproj\tFILE_DOESNT_EXIST" == get_broken_projections_info(node, table_name) assert "BACKUP_CREATED" in node.query( f""" @@ -466,7 +462,6 @@ def test_broken_projections_in_backups(cluster): check(node, table_name, 1) break_projection(node, table_name, "proj", "all_1_1_0", "part") - # TODO: check(node, table_name, 0, "proj", "FILE_DOESNT_EXIST") assert "Part all_1_1_0 has a broken projection proj" in check_table_full( node, table_name ) @@ -477,7 +472,7 @@ def test_broken_projections_in_backups(cluster): assert "BACKUP_CREATED" in node.query( f""" set backup_restore_keeper_fault_injection_probability=0.0; - backup table {table_name} to Disk('backups', 'b4') settings check_projection_parts=false; + backup table {table_name} to Disk('backups', 'b4') settings check_projection_parts=false, allow_backup_broken_projections=true; """ ) @@ -488,5 +483,5 @@ def test_broken_projections_in_backups(cluster): restore table {table_name} from Disk('backups', 'b4'); """ ) - check(node, table_name, 1) - assert "" == get_broken_projections_info(node, table_name) + check(node, table_name, 0) + assert "all_1_1_0\tproj\tNO_FILE_IN_DATA_PART" == get_broken_projections_info(node, table_name) From 1e9de73bf57de1eb66007cba0fecb9f0459c973e Mon Sep 17 00:00:00 2001 From: kssenii Date: Wed, 17 Jan 2024 15:40:46 +0100 Subject: [PATCH 0154/1081] Fix style check --- tests/integration/test_broken_projections/test.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py index eb8c452fff0..1b192e0df24 100644 --- a/tests/integration/test_broken_projections/test.py +++ b/tests/integration/test_broken_projections/test.py @@ -484,4 +484,6 @@ def 
test_broken_projections_in_backups(cluster): """ ) check(node, table_name, 0) - assert "all_1_1_0\tproj\tNO_FILE_IN_DATA_PART" == get_broken_projections_info(node, table_name) + assert "all_1_1_0\tproj\tNO_FILE_IN_DATA_PART" == get_broken_projections_info( + node, table_name + ) From d3b4dea8058e1cccb34bf39b3f26b4c0e5b2368a Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Wed, 17 Jan 2024 20:02:17 +0100 Subject: [PATCH 0155/1081] Fix clang tidy build --- src/Analyzer/Passes/QueryAnalysisPass.cpp | 2 +- src/Interpreters/InterpreterCreateQuery.cpp | 6 +----- 2 files changed, 2 insertions(+), 6 deletions(-) diff --git a/src/Analyzer/Passes/QueryAnalysisPass.cpp b/src/Analyzer/Passes/QueryAnalysisPass.cpp index d2270ea9910..7322d53d831 100644 --- a/src/Analyzer/Passes/QueryAnalysisPass.cpp +++ b/src/Analyzer/Passes/QueryAnalysisPass.cpp @@ -6401,7 +6401,7 @@ void QueryAnalyzer::resolveTableFunction(QueryTreeNodePtr & table_function_node, { String database_name = scope.context->getCurrentDatabase(); - String table_name = ""; + String table_name; if (table_function_node->getOriginalAST() && table_function_node->getOriginalAST()->as()) { diff --git a/src/Interpreters/InterpreterCreateQuery.cpp b/src/Interpreters/InterpreterCreateQuery.cpp index 6031c8b4e46..e71946caafe 100644 --- a/src/Interpreters/InterpreterCreateQuery.cpp +++ b/src/Interpreters/InterpreterCreateQuery.cpp @@ -809,11 +809,7 @@ InterpreterCreateQuery::TableProperties InterpreterCreateQuery::getTableProperti * for example: LIMIT, OFFSET, functions parameters, functions constant only arguments. */ - SelectQueryOptions options; - if (create.isParameterizedView()) - options = options.createParameterizedView(); - - InterpreterSelectWithUnionQuery interpreter(create.select->clone(), getContext(), options); + InterpreterSelectWithUnionQuery interpreter(create.select->clone(), getContext(), SelectQueryOptions()); as_select_sample = interpreter.getSampleBlock(); } From e3f5058f6129badab2e0071e86f51ffb77e57ce5 Mon Sep 17 00:00:00 2001 From: MyroTk <44327070+MyroTk@users.noreply.github.com> Date: Wed, 17 Jan 2024 12:13:15 -0800 Subject: [PATCH 0156/1081] Update Dockerfile --- docker/test/integration/runner/Dockerfile | 1 + 1 file changed, 1 insertion(+) diff --git a/docker/test/integration/runner/Dockerfile b/docker/test/integration/runner/Dockerfile index c795fbf0672..2a81db78a3d 100644 --- a/docker/test/integration/runner/Dockerfile +++ b/docker/test/integration/runner/Dockerfile @@ -94,6 +94,7 @@ RUN python3 -m pip install --no-cache-dir \ pytest-repeat \ pytest-timeout \ pytest-xdist \ + pytest-reportlog==0.4.0 \ pytz \ pyyaml==5.3.1 \ redis \ From f89803ebf65d7590e73816052b7ac2de81e04864 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Wed, 17 Jan 2024 23:17:53 +0100 Subject: [PATCH 0157/1081] Slightly better --- docker/test/base/setup_export_logs.sh | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/docker/test/base/setup_export_logs.sh b/docker/test/base/setup_export_logs.sh index 416281c2aa3..043adf99ffc 100755 --- a/docker/test/base/setup_export_logs.sh +++ b/docker/test/base/setup_export_logs.sh @@ -156,7 +156,8 @@ function setup_logs_replication # Do not try to resolve stack traces in case of debug/sanitizers # build, since it is too slow (flushing of trace_log can take ~1min # with such MV attached) - if [[ "$debug_or_sanitizer_build" = 1 ]]; then + if [[ "$debug_or_sanitizer_build" = 1 ]] + then EXTRA_COLUMNS_EXPRESSION_FOR_TABLE="${EXTRA_COLUMNS_EXPRESSION}" else 
EXTRA_COLUMNS_EXPRESSION_FOR_TABLE="${EXTRA_COLUMNS_EXPRESSION_TRACE_LOG}" @@ -180,7 +181,7 @@ function setup_logs_replication # Create the destination table with adapted name and structure: statement=$(clickhouse-client --format TSVRaw --query "SHOW CREATE TABLE system.${table}" | sed -r -e ' s/^\($/('"$EXTRA_COLUMNS_FOR_TABLE"'/; - s/ORDER BY \(/ORDER BY ('"$EXTRA_ORDER_BY_COLUMNS"'/; + s/ORDER BY \(?(.+?)\)?/ORDER BY ('"$EXTRA_ORDER_BY_COLUMNS"', \1)'/; s/^CREATE TABLE system\.\w+_log$/CREATE TABLE IF NOT EXISTS '"$table"'_'"$hash"'/; /^TTL /d ') From f9ca4e3b8541d7db85effa3f9be286f7ad916965 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Thu, 18 Jan 2024 00:52:05 +0100 Subject: [PATCH 0158/1081] Slightly better --- docker/test/base/setup_export_logs.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docker/test/base/setup_export_logs.sh b/docker/test/base/setup_export_logs.sh index 043adf99ffc..7033d4b52e2 100755 --- a/docker/test/base/setup_export_logs.sh +++ b/docker/test/base/setup_export_logs.sh @@ -181,7 +181,7 @@ function setup_logs_replication # Create the destination table with adapted name and structure: statement=$(clickhouse-client --format TSVRaw --query "SHOW CREATE TABLE system.${table}" | sed -r -e ' s/^\($/('"$EXTRA_COLUMNS_FOR_TABLE"'/; - s/ORDER BY \(?(.+?)\)?/ORDER BY ('"$EXTRA_ORDER_BY_COLUMNS"', \1)'/; + s/ORDER BY \(?(.+?)\)?/ORDER BY ('"$EXTRA_ORDER_BY_COLUMNS"', \1)/; s/^CREATE TABLE system\.\w+_log$/CREATE TABLE IF NOT EXISTS '"$table"'_'"$hash"'/; /^TTL /d ') From 61101d1a577b441931ef74b24d449b085d0f0ec3 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Thu, 18 Jan 2024 01:16:50 +0100 Subject: [PATCH 0159/1081] Add a release build with coverage, turn off coverage in the debug build --- .github/workflows/master.yml | 8 ++++++++ .github/workflows/pull_request.yml | 8 ++++++++ tests/ci/ci_config.py | 17 +++++++++++++---- 3 files changed, 29 insertions(+), 4 deletions(-) diff --git a/.github/workflows/master.yml b/.github/workflows/master.yml index d2865eb737d..50d3eb4a062 100644 --- a/.github/workflows/master.yml +++ b/.github/workflows/master.yml @@ -98,6 +98,14 @@ jobs: build_name: package_release checkout_depth: 0 data: ${{ needs.RunConfig.outputs.data }} + BuilderDebReleaseCoverage: + needs: [ RunConfig, BuildDockers ] + if: ${{ !failure() && !cancelled() }} + uses: ./.github/workflows/reusable_build.yml + with: + build_name: package_release_coverage + checkout_depth: 0 + data: ${{ needs.RunConfig.outputs.data }} BuilderDebAarch64: needs: [RunConfig, BuildDockers] if: ${{ !failure() && !cancelled() }} diff --git a/.github/workflows/pull_request.yml b/.github/workflows/pull_request.yml index bd2b2b60904..7f843f82c01 100644 --- a/.github/workflows/pull_request.yml +++ b/.github/workflows/pull_request.yml @@ -146,6 +146,14 @@ jobs: build_name: package_release checkout_depth: 0 data: ${{ needs.RunConfig.outputs.data }} + BuilderDebReleaseCoverage: + needs: [ RunConfig, FastTest ] + if: ${{ !failure() && !cancelled() }} + uses: ./.github/workflows/reusable_build.yml + with: + build_name: package_release_coverage + checkout_depth: 0 + data: ${{ needs.RunConfig.outputs.data }} BuilderDebAarch64: needs: [RunConfig, FastTest] if: ${{ !failure() && !cancelled() }} diff --git a/tests/ci/ci_config.py b/tests/ci/ci_config.py index b8dff3f0a28..1ca4e06bc8c 100644 --- a/tests/ci/ci_config.py +++ b/tests/ci/ci_config.py @@ -474,6 +474,12 @@ CI_CONFIG = CiConfig( name="package_debug", compiler="clang-17", debug_build=True, + package_type="deb", + 
sparse_checkout=True, + ), + "package_release_coverage": BuildConfig( + name="package_release_coverage", + compiler="clang-17", coverage=True, package_type="deb", sparse_checkout=True, @@ -571,6 +577,7 @@ CI_CONFIG = CiConfig( "package_tsan", "package_msan", "package_debug", + "package_release_coverage", "binary_release", "fuzzers", ] @@ -660,16 +667,15 @@ CI_CONFIG = CiConfig( "Stateful tests (release)": TestConfig( "package_release", job_config=JobConfig(**stateful_test_common_params) # type: ignore ), + "Stateful tests (coverage)": TestConfig( + "package_release_coverage", job_config=JobConfig(**stateful_test_common_params) # type: ignore + ), "Stateful tests (aarch64)": TestConfig( "package_aarch64", job_config=JobConfig(**stateful_test_common_params) # type: ignore ), "Stateful tests (release, DatabaseOrdinary)": TestConfig( "package_release", job_config=JobConfig(**stateful_test_common_params) # type: ignore ), - # "Stateful tests (release, DatabaseReplicated)": TestConfig( - # "package_release", job_config=JobConfig(**stateful_test_common_params) # type: ignore - # ), - # Stateful tests for parallel replicas "Stateful tests (release, ParallelReplicas)": TestConfig( "package_release", job_config=JobConfig(**stateful_test_common_params) # type: ignore ), @@ -712,6 +718,9 @@ CI_CONFIG = CiConfig( "Stateless tests (release)": TestConfig( "package_release", job_config=JobConfig(**statless_test_common_params) # type: ignore ), + "Stateless tests (coverage)": TestConfig( + "package_release_coverage", job_config=JobConfig(**statless_test_common_params) # type: ignore + ), "Stateless tests (aarch64)": TestConfig( "package_aarch64", job_config=JobConfig(**statless_test_common_params) # type: ignore ), From b9f8fff623448e7013bbe604b39d0f72b81032f9 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Thu, 18 Jan 2024 01:36:48 +0100 Subject: [PATCH 0160/1081] Fix YAML --- .github/workflows/master.yml | 2 +- .github/workflows/pull_request.yml | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/master.yml b/.github/workflows/master.yml index 50d3eb4a062..1920f3a2a56 100644 --- a/.github/workflows/master.yml +++ b/.github/workflows/master.yml @@ -99,7 +99,7 @@ jobs: checkout_depth: 0 data: ${{ needs.RunConfig.outputs.data }} BuilderDebReleaseCoverage: - needs: [ RunConfig, BuildDockers ] + needs: [RunConfig, BuildDockers] if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: diff --git a/.github/workflows/pull_request.yml b/.github/workflows/pull_request.yml index 7f843f82c01..57199e6b9d9 100644 --- a/.github/workflows/pull_request.yml +++ b/.github/workflows/pull_request.yml @@ -147,7 +147,7 @@ jobs: checkout_depth: 0 data: ${{ needs.RunConfig.outputs.data }} BuilderDebReleaseCoverage: - needs: [ RunConfig, FastTest ] + needs: [RunConfig, FastTest] if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: From cc5cc361ef561993bc7bbea6f1588562f7d3deae Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Thu, 18 Jan 2024 12:35:49 +0100 Subject: [PATCH 0161/1081] Fix error --- docker/packager/packager | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docker/packager/packager b/docker/packager/packager index c310185b071..8efd3b8f302 100755 --- a/docker/packager/packager +++ b/docker/packager/packager @@ -289,7 +289,7 @@ def parse_env_variables( result.append("BUILD_TYPE=None") if coverage: - cmake_flags.append("-DSANITIZE_COVERAGE=1") + cmake_flags.append("-DSANITIZE_COVERAGE=1 
-DBUILD_STANDALONE_KEEPER=0") if not cache: cmake_flags.append("-DCOMPILER_CACHE=disabled") From 6c0445f36584a60724f7d616f47c7b953621997c Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Thu, 18 Jan 2024 12:47:18 +0100 Subject: [PATCH 0162/1081] Fix CMake --- cmake/sanitize.cmake | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/cmake/sanitize.cmake b/cmake/sanitize.cmake index 3882b51227e..23e9cc34fec 100644 --- a/cmake/sanitize.cmake +++ b/cmake/sanitize.cmake @@ -63,14 +63,14 @@ endif() option(WITH_COVERAGE "Instrumentation for code coverage with default implementation" OFF) if (WITH_COVERAGE) - message (INFORMATION "Enabled instrumentation for code coverage") + message (STATUS "Enabled instrumentation for code coverage") set(COVERAGE_FLAGS "-fprofile-instr-generate -fcoverage-mapping") endif() option (SANITIZE_COVERAGE "Instrumentation for code coverage with custom callbacks" OFF) if (SANITIZE_COVERAGE) - message (INFORMATION "Enabled instrumentation for code coverage") + message (STATUS "Enabled instrumentation for code coverage") # We set this define for whole build to indicate that at least some parts are compiled with coverage. # And to expose it in system.build_options. From 6d6b8fcf8e988d78fc983ed4043ed556e36b833b Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Thu, 18 Jan 2024 12:58:50 +0100 Subject: [PATCH 0163/1081] Add missing comments in code --- tests/ci/ci_config.py | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/tests/ci/ci_config.py b/tests/ci/ci_config.py index 1ca4e06bc8c..45bdfbecb0c 100644 --- a/tests/ci/ci_config.py +++ b/tests/ci/ci_config.py @@ -55,6 +55,13 @@ class JobConfig: run_always: bool = False +# About the "sparse_checkout" option: +# +# Misha f. Shiryaev +# :facepalm: +# we have this feature, it's used by devs, we need to test it in CI +# It's not useful for the CI itself + @dataclass class BuildConfig: name: str From db3ffa5c86dba79ca7052abe8d53799ac3e4afb9 Mon Sep 17 00:00:00 2001 From: robot-clickhouse Date: Thu, 18 Jan 2024 12:11:03 +0000 Subject: [PATCH 0164/1081] Automatic style fix --- tests/ci/ci_config.py | 1 + 1 file changed, 1 insertion(+) diff --git a/tests/ci/ci_config.py b/tests/ci/ci_config.py index 45bdfbecb0c..ab37659e65b 100644 --- a/tests/ci/ci_config.py +++ b/tests/ci/ci_config.py @@ -62,6 +62,7 @@ class JobConfig: # we have this feature, it's used by devs, we need to test it in CI # It's not useful for the CI itself + @dataclass class BuildConfig: name: str From 0a6331f5f756d5d6465095edac89d2a03618d773 Mon Sep 17 00:00:00 2001 From: Dale Mcdiarmid Date: Thu, 18 Jan 2024 13:18:13 +0000 Subject: [PATCH 0165/1081] spell-check additions --- utils/check-style/aspell-ignore/en/aspell-dict.txt | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/utils/check-style/aspell-ignore/en/aspell-dict.txt b/utils/check-style/aspell-ignore/en/aspell-dict.txt index 73b7a081797..1f6b24597da 100644 --- a/utils/check-style/aspell-ignore/en/aspell-dict.txt +++ b/utils/check-style/aspell-ignore/en/aspell-dict.txt @@ -1,4 +1,4 @@ -personal_ws-1.1 en 2657 +personal_ws-1.1 en 2697 AArch ACLs ALTERs @@ -2016,6 +2016,7 @@ pcre performant perl persistency +personal_ws-1.1 en 2657 phpclickhouse pipelining plaintext From 8b730811efd055f1b200f277202a34258a93722e Mon Sep 17 00:00:00 2001 From: Dale McDiarmid Date: Thu, 18 Jan 2024 13:24:40 +0000 Subject: [PATCH 0166/1081] Update aspell-dict.txt --- utils/check-style/aspell-ignore/en/aspell-dict.txt | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git 
a/utils/check-style/aspell-ignore/en/aspell-dict.txt b/utils/check-style/aspell-ignore/en/aspell-dict.txt index 73b7a081797..1f6b24597da 100644 --- a/utils/check-style/aspell-ignore/en/aspell-dict.txt +++ b/utils/check-style/aspell-ignore/en/aspell-dict.txt @@ -1,4 +1,4 @@ -personal_ws-1.1 en 2657 +personal_ws-1.1 en 2697 AArch ACLs ALTERs @@ -2016,6 +2016,7 @@ pcre performant perl persistency +personal_ws-1.1 en 2657 phpclickhouse pipelining plaintext From 8ac04c6dd8a945e0f189aae572c54ee4458f75dd Mon Sep 17 00:00:00 2001 From: avogar Date: Thu, 18 Jan 2024 15:15:57 +0000 Subject: [PATCH 0167/1081] Address comments --- src/DataTypes/DataTypeVariant.cpp | 9 ++++ .../Serializations/SerializationVariant.cpp | 48 +++++++------------ .../Serializations/SerializationVariant.h | 23 +++++++++ .../SerializationVariantElement.cpp | 14 +++--- 4 files changed, 57 insertions(+), 37 deletions(-) diff --git a/src/DataTypes/DataTypeVariant.cpp b/src/DataTypes/DataTypeVariant.cpp index 2bc4dfa5a7a..e0510373960 100644 --- a/src/DataTypes/DataTypeVariant.cpp +++ b/src/DataTypes/DataTypeVariant.cpp @@ -105,6 +105,15 @@ ColumnPtr DataTypeVariant::createColumnConst(size_t size, const DB::Field & fiel } else { + /// We don't have exact mapping Field type -> Data type, so we cannot + /// always know in which variant we need to insert the field by it's type. + /// Examples: + /// Field(42) and Variant(UInt16, String). Type of the Field - UInt64, but we can insert it in UInt16 + /// Field(42) and Variant(Date, String). Type of the Field - UInt64, but we can insert it in Date + + /// Let's first apply FieldToDataType visitor to find best Data type for this field. + /// If we have variant with such type, we will insert this field into it. + /// Otherwise we will try to find the first variant that has default Field value with the same type. auto field_type = applyVisitor(FieldToDataType(), field); auto discr = tryGetVariantDiscriminator(field_type); if (!discr) diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp index 64fcb63d604..78ec0a5e2da 100644 --- a/src/DataTypes/Serializations/SerializationVariant.cpp +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -200,19 +200,12 @@ void SerializationVariant::serializeBinaryBulkWithMultipleStreams( for (size_t i = 0; i != limit; ++i) writeBinaryLittleEndian(non_empty_global_discr, *discriminators_stream); - /// Second, serialize variants in global order. + /// Second, serialize non-empty variant (other variants are empty and we can skip their serialization). settings.path.push_back(Substream::VariantElements); - for (size_t i = 0; i != variants.size(); ++i) - { - addVariantElementToPath(settings.path, i); - /// For non empty variant use the same offset/limit as for whole Variant column - if (i == non_empty_global_discr) - variants[i]->serializeBinaryBulkWithMultipleStreams(col.getVariantByGlobalDiscriminator(i), offset, limit, settings, variant_state->states[i]); - /// For empty variants, use just 0/0, they won't serialize anything. 
- else - variants[i]->serializeBinaryBulkWithMultipleStreams(col.getVariantByGlobalDiscriminator(i), 0, 0, settings, variant_state->states[i]); - settings.path.pop_back(); - } + addVariantElementToPath(settings.path, non_empty_global_discr); + /// We can use the same offset/limit as for whole Variant column + variants[non_empty_global_discr]->serializeBinaryBulkWithMultipleStreams(col.getVariantByGlobalDiscriminator(non_empty_global_discr), offset, limit, settings, variant_state->states[non_empty_global_discr]); + settings.path.pop_back(); settings.path.pop_back(); return; } @@ -237,26 +230,22 @@ void SerializationVariant::serializeBinaryBulkWithMultipleStreams( } } - /// If limit for some variant is 0, it means that we don't have its discriminator in the range. - /// Set offset to the size of column for such variants, so we won't serialize values from them. - for (size_t i = 0; i != variant_offsets_and_limits.size(); ++i) - { - if (!variant_offsets_and_limits[i].second) - variant_offsets_and_limits[i].first = col.getVariantByGlobalDiscriminator(i).size(); - } - /// Serialize variants in global order. settings.path.push_back(Substream::VariantElements); for (size_t i = 0; i != variants.size(); ++i) { - addVariantElementToPath(settings.path, i); - variants[i]->serializeBinaryBulkWithMultipleStreams( - col.getVariantByGlobalDiscriminator(i), - variant_offsets_and_limits[i].first, - variant_offsets_and_limits[i].second, - settings, - variant_state->states[i]); - settings.path.pop_back(); + /// Serialize variant only if we have its discriminator in the range. + if (variant_offsets_and_limits[i].second) + { + addVariantElementToPath(settings.path, i); + variants[i]->serializeBinaryBulkWithMultipleStreams( + col.getVariantByGlobalDiscriminator(i), + variant_offsets_and_limits[i].first, + variant_offsets_and_limits[i].second, + settings, + variant_state->states[i]); + settings.path.pop_back(); + } } settings.path.pop_back(); } @@ -564,9 +553,6 @@ std::vector SerializationVariant::getVariantsDeserializeTextOrder(const } std::sort(order.begin(), order.end(), [&](size_t left, size_t right) { return priorities[left] > priorities[right]; }); - String types_order; - for (auto i : order) - types_order += " " + variant_types[i]->getName(); return order; } diff --git a/src/DataTypes/Serializations/SerializationVariant.h b/src/DataTypes/Serializations/SerializationVariant.h index b6bee94c65f..3f53dcf1339 100644 --- a/src/DataTypes/Serializations/SerializationVariant.h +++ b/src/DataTypes/Serializations/SerializationVariant.h @@ -6,6 +6,29 @@ namespace DB { +/// Class for serializing/deserializing column with Variant type. +/// It supports both text and binary bulk serializations/deserializations. +/// +/// During text serialization it checks discriminator of the current row and +/// uses corresponding text serialization of this variant. +/// +/// During text deserialization it tries all variants deserializations +/// (using tryDeserializeText* methods of ISerialization) in predefined order +/// and inserts data in the first variant with succeeded deserialization. +/// +/// During binary bulk serialization it transforms local discriminators +/// to global and serializes them into a separate stream VariantDiscriminators. +/// Each variant is serialized into a separate stream with path VariantElements/VariantElement +/// (VariantElements stream is needed for correct sub-columns creation). 
We store and serialize +/// variants in a sparse form (the size of a variant column equals to the number of its discriminator +/// in the discriminators column), so during deserialization the limit for each variant is +/// calculated according to discriminators column. +/// Offsets column is not serialized and stored only in memory. +/// +/// During binary bulk deserialization we first deserialize discriminators from corresponding stream +/// and use them to calculate the limit for each variant. Each variant is deserialized from +/// corresponding stream using calculated limit. Offsets column is not deserialized and constructed +/// according to discriminators. class SerializationVariant : public ISerialization { public: diff --git a/src/DataTypes/Serializations/SerializationVariantElement.cpp b/src/DataTypes/Serializations/SerializationVariantElement.cpp index e06a20d2990..be91e0ba2ee 100644 --- a/src/DataTypes/Serializations/SerializationVariantElement.cpp +++ b/src/DataTypes/Serializations/SerializationVariantElement.cpp @@ -149,19 +149,21 @@ void SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams( assert_cast(*variant_element_state->variant->assumeMutable()).nestedRemoveNullable(); } + /// If nothing to deserialize, just insert defaults. + if (variant_limit == 0) + { + mutable_column->insertManyDefaults(limit); + return; + } + addVariantToPath(settings.path); nested_serialization->deserializeBinaryBulkWithMultipleStreams(variant_element_state->variant, variant_limit, settings, variant_element_state->variant_element_state, cache); removeVariantFromPath(settings.path); size_t variant_offset = variant_element_state->variant->size() - variant_limit; - /// If don't have our discriminator in range, just insert defaults. - if (variant_limit == 0) - { - mutable_column->insertManyDefaults(limit); - } /// If we have only our discriminator in range, insert the whole range to result column. 
- else if (variant_limit == limit) + if (variant_limit == limit) { mutable_column->insertRangeFrom(*variant_element_state->variant, variant_offset, variant_limit); } From f202d713711857c083de5aaba1198198d2eaa3a4 Mon Sep 17 00:00:00 2001 From: avogar Date: Thu, 18 Jan 2024 17:29:36 +0000 Subject: [PATCH 0168/1081] Make alter with variant espansion as no-op, add tests for alters --- src/DataTypes/DataTypeVariant.cpp | 22 ++ src/DataTypes/DataTypeVariant.h | 4 + .../Serializations/SerializationVariant.cpp | 2 +- .../SerializationVariantElement.cpp | 16 +- src/Storages/MergeTree/MutateTask.cpp | 20 +- .../02941_variant_type_alters.reference | 330 ++++++++++++++++++ .../0_stateless/02941_variant_type_alters.sh | 61 ++++ 7 files changed, 452 insertions(+), 3 deletions(-) create mode 100644 tests/queries/0_stateless/02941_variant_type_alters.reference create mode 100755 tests/queries/0_stateless/02941_variant_type_alters.sh diff --git a/src/DataTypes/DataTypeVariant.cpp b/src/DataTypes/DataTypeVariant.cpp index e0510373960..3a39fdf9ea8 100644 --- a/src/DataTypes/DataTypeVariant.cpp +++ b/src/DataTypes/DataTypeVariant.cpp @@ -230,6 +230,28 @@ static DataTypePtr create(const ASTPtr & arguments) return std::make_shared(nested_types); } +bool isVariantExtension(const DataTypePtr & from_type, const DataTypePtr & to_type) +{ + const auto * from_variant = typeid_cast(from_type.get()); + const auto * to_variant = typeid_cast(to_type.get()); + if (!from_variant || !to_variant) + return false; + + const auto & to_variants = to_variant->getVariants(); + std::unordered_set to_variant_types; + to_variant_types.reserve(to_variants.size()); + for (const auto & variant : to_variants) + to_variant_types.insert(variant->getName()); + + for (const auto & variant : from_variant->getVariants()) + { + if (!to_variant_types.contains(variant->getName())) + return false; + } + + return true; +} + void registerDataTypeVariant(DataTypeFactory & factory) { diff --git a/src/DataTypes/DataTypeVariant.h b/src/DataTypes/DataTypeVariant.h index ca15dff1476..1a1cb6c12f2 100644 --- a/src/DataTypes/DataTypeVariant.h +++ b/src/DataTypes/DataTypeVariant.h @@ -61,5 +61,9 @@ private: SerializationPtr doGetDefaultSerialization() const override; }; +/// Check if conversion from from_type to to_type is Variant extension +/// (both types are Variants and to_type contains all variants from from_type). 
+bool isVariantExtension(const DataTypePtr & from_type, const DataTypePtr & to_type); + } diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp index 78ec0a5e2da..48a78dd54a9 100644 --- a/src/DataTypes/Serializations/SerializationVariant.cpp +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -275,7 +275,7 @@ void SerializationVariant::deserializeBinaryBulkWithMultipleStreams( { auto * discriminators_stream = settings.getter(settings.path); if (!discriminators_stream) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Got empty stream for VariantDiscriminators in SerializationVariant::deserializeBinaryBulkWithMultipleStreams"); + return; SerializationNumber().deserializeBinaryBulk(*col.getLocalDiscriminatorsPtr()->assumeMutable(), *discriminators_stream, limit, 0); addToSubstreamsCache(cache, settings.path, col.getLocalDiscriminatorsPtr()); diff --git a/src/DataTypes/Serializations/SerializationVariantElement.cpp b/src/DataTypes/Serializations/SerializationVariantElement.cpp index be91e0ba2ee..80524cbd814 100644 --- a/src/DataTypes/Serializations/SerializationVariantElement.cpp +++ b/src/DataTypes/Serializations/SerializationVariantElement.cpp @@ -91,7 +91,7 @@ void SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams( { auto * discriminators_stream = settings.getter(settings.path); if (!discriminators_stream) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Got empty stream for VariantDiscriminators in SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams"); + return; /// If we started to read a new column, reinitialize discriminators column in deserialization state. if (!variant_element_state->discriminators || result_column->empty()) @@ -156,10 +156,24 @@ void SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams( return; } + size_t prev_variant_size = variant_element_state->variant->size(); addVariantToPath(settings.path); nested_serialization->deserializeBinaryBulkWithMultipleStreams(variant_element_state->variant, variant_limit, settings, variant_element_state->variant_element_state, cache); removeVariantFromPath(settings.path); + /// If nothing was deserialized when variant_limit > 0 + /// it means that we don't have a stream for such sub-column. + /// It may happen during ALTER MODIFY column with Variant extension. + /// In this case we should just insert default values. + if (variant_element_state->variant->empty()) + { + mutable_column->insertManyDefaults(limit); + return; + } + + if (variant_element_state->variant->size() != prev_variant_size + variant_limit) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Unexpected variant column size after deserialization. Expected {}, got {}", prev_variant_size + variant_limit, variant_element_state->variant->size()); + size_t variant_offset = variant_element_state->variant->size() - variant_limit; /// If we have only our discriminator in range, insert the whole range to result column. 
diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index e4070aa8262..44734ec98c0 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -22,6 +22,7 @@ #include #include #include +#include #include #include @@ -1921,7 +1922,7 @@ static bool canSkipConversionToNullable(const MergeTreeDataPartPtr & part, const if (!part_column) return false; - /// For ALTER MODIFY COLUMN from 'Type' to 'Nullable(Type)' we can skip mutatation and + /// For ALTER MODIFY COLUMN from 'Type' to 'Nullable(Type)' we can skip mutation and /// apply only metadata conversion. But it doesn't work for custom serialization. const auto * to_nullable = typeid_cast(command.data_type.get()); if (!to_nullable) @@ -1937,6 +1938,20 @@ static bool canSkipConversionToNullable(const MergeTreeDataPartPtr & part, const return true; } +static bool canSkipConversionToVariant(const MergeTreeDataPartPtr & part, const MutationCommand & command) +{ + if (command.type != MutationCommand::READ_COLUMN) + return false; + + auto part_column = part->tryGetColumn(command.column_name); + if (!part_column) + return false; + + /// For ALTER MODIFY COLUMN with Variant extension (like 'Variant(T1, T2)' to 'Variant(T1, T2, T3, ...)') + /// we can skip mutation and apply only metadata conversion. + return isVariantExtension(part_column->type, command.data_type); +} + static bool canSkipMutationCommandForPart(const MergeTreeDataPartPtr & part, const MutationCommand & command, const ContextPtr & context) { if (command.partition) @@ -1952,6 +1967,9 @@ static bool canSkipMutationCommandForPart(const MergeTreeDataPartPtr & part, con if (canSkipConversionToNullable(part, command)) return true; + if (canSkipConversionToVariant(part, command)) + return true; + return false; } diff --git a/tests/queries/0_stateless/02941_variant_type_alters.reference b/tests/queries/0_stateless/02941_variant_type_alters.reference new file mode 100644 index 00000000000..52c834e455b --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_alters.reference @@ -0,0 +1,330 @@ +Memory +initial insert +alter add column 1 +0 0 \N \N \N +1 1 \N \N \N +2 2 \N \N \N +insert after alter add column 1 +0 0 \N \N \N +1 1 \N \N \N +2 2 \N \N \N +3 3 3 \N 3 +4 4 4 \N 4 +5 5 5 \N 5 +6 6 str_6 str_6 \N +7 7 str_7 str_7 \N +8 8 str_8 str_8 \N +9 9 \N \N \N +10 10 \N \N \N +11 11 \N \N \N +12 12 12 \N 12 +13 13 str_13 str_13 \N +14 14 \N \N \N +alter modify column 1 +0 0 \N \N \N \N +1 1 \N \N \N \N +2 2 \N \N \N \N +3 3 3 \N 3 \N +4 4 4 \N 4 \N +5 5 5 \N 5 \N +6 6 str_6 str_6 \N \N +7 7 str_7 str_7 \N \N +8 8 str_8 str_8 \N \N +9 9 \N \N \N \N +10 10 \N \N \N \N +11 11 \N \N \N \N +12 12 12 \N 12 \N +13 13 str_13 str_13 \N \N +14 14 \N \N \N \N +insert after alter modify column 1 +0 0 \N \N \N \N +1 1 \N \N \N \N +2 2 \N \N \N \N +3 3 3 \N 3 \N +4 4 4 \N 4 \N +5 5 5 \N 5 \N +6 6 str_6 str_6 \N \N +7 7 str_7 str_7 \N \N +8 8 str_8 str_8 \N \N +9 9 \N \N \N \N +10 10 \N \N \N \N +11 11 \N \N \N \N +12 12 12 \N 12 \N +13 13 str_13 str_13 \N \N +14 14 \N \N \N \N +15 15 1970-01-16 \N \N 1970-01-16 +16 16 1970-01-17 \N \N 1970-01-17 +17 17 1970-01-18 \N \N 1970-01-18 +18 18 1970-01-19 \N \N 1970-01-19 +19 19 \N \N \N \N +20 20 20 \N 20 \N +21 21 str_21 str_21 \N \N +alter modify column 2 +0 0 \N \N \N \N \N \N +1 1 \N \N \N \N \N \N +2 2 \N \N \N \N \N \N +3 3 \N \N 3 \N 3 \N +4 4 \N \N 4 \N 4 \N +5 5 \N \N 5 \N 5 \N +6 6 \N \N str_6 str_6 \N \N +7 7 \N \N str_7 str_7 \N \N +8 8 \N \N str_8 str_8 \N \N +9 9 \N \N 
\N \N \N \N +10 10 \N \N \N \N \N \N +11 11 \N \N \N \N \N \N +12 12 \N \N 12 \N 12 \N +13 13 \N \N str_13 str_13 \N \N +14 14 \N \N \N \N \N \N +15 15 \N \N 1970-01-16 \N \N 1970-01-16 +16 16 \N \N 1970-01-17 \N \N 1970-01-17 +17 17 \N \N 1970-01-18 \N \N 1970-01-18 +18 18 \N \N 1970-01-19 \N \N 1970-01-19 +19 19 \N \N \N \N \N \N +20 20 \N \N 20 \N 20 \N +21 21 \N \N str_21 str_21 \N \N +insert after alter modify column 2 +0 0 \N \N \N \N \N \N +1 1 \N \N \N \N \N \N +2 2 \N \N \N \N \N \N +3 3 \N \N 3 \N 3 \N +4 4 \N \N 4 \N 4 \N +5 5 \N \N 5 \N 5 \N +6 6 \N \N str_6 str_6 \N \N +7 7 \N \N str_7 str_7 \N \N +8 8 \N \N str_8 str_8 \N \N +9 9 \N \N \N \N \N \N +10 10 \N \N \N \N \N \N +11 11 \N \N \N \N \N \N +12 12 \N \N 12 \N 12 \N +13 13 \N \N str_13 str_13 \N \N +14 14 \N \N \N \N \N \N +15 15 \N \N 1970-01-16 \N \N 1970-01-16 +16 16 \N \N 1970-01-17 \N \N 1970-01-17 +17 17 \N \N 1970-01-18 \N \N 1970-01-18 +18 18 \N \N 1970-01-19 \N \N 1970-01-19 +19 19 \N \N \N \N \N \N +20 20 \N \N 20 \N 20 \N +21 21 \N \N str_21 str_21 \N \N +22 str_22 \N str_22 \N \N \N \N +23 \N \N \N \N \N \N \N +24 24 24 \N \N \N \N \N +MergeTree compact +initial insert +alter add column 1 +0 0 \N \N \N +1 1 \N \N \N +2 2 \N \N \N +insert after alter add column 1 +0 0 \N \N \N +1 1 \N \N \N +2 2 \N \N \N +3 3 3 \N 3 +4 4 4 \N 4 +5 5 5 \N 5 +6 6 str_6 str_6 \N +7 7 str_7 str_7 \N +8 8 str_8 str_8 \N +9 9 \N \N \N +10 10 \N \N \N +11 11 \N \N \N +12 12 12 \N 12 +13 13 str_13 str_13 \N +14 14 \N \N \N +alter modify column 1 +0 0 \N \N \N \N +1 1 \N \N \N \N +2 2 \N \N \N \N +3 3 3 \N 3 \N +4 4 4 \N 4 \N +5 5 5 \N 5 \N +6 6 str_6 str_6 \N \N +7 7 str_7 str_7 \N \N +8 8 str_8 str_8 \N \N +9 9 \N \N \N \N +10 10 \N \N \N \N +11 11 \N \N \N \N +12 12 12 \N 12 \N +13 13 str_13 str_13 \N \N +14 14 \N \N \N \N +insert after alter modify column 1 +0 0 \N \N \N \N +1 1 \N \N \N \N +2 2 \N \N \N \N +3 3 3 \N 3 \N +4 4 4 \N 4 \N +5 5 5 \N 5 \N +6 6 str_6 str_6 \N \N +7 7 str_7 str_7 \N \N +8 8 str_8 str_8 \N \N +9 9 \N \N \N \N +10 10 \N \N \N \N +11 11 \N \N \N \N +12 12 12 \N 12 \N +13 13 str_13 str_13 \N \N +14 14 \N \N \N \N +15 15 1970-01-16 \N \N 1970-01-16 +16 16 1970-01-17 \N \N 1970-01-17 +17 17 1970-01-18 \N \N 1970-01-18 +18 18 1970-01-19 \N \N 1970-01-19 +19 19 \N \N \N \N +20 20 20 \N 20 \N +21 21 str_21 str_21 \N \N +alter modify column 2 +0 0 0 \N \N \N \N \N +1 1 1 \N \N \N \N \N +2 2 2 \N \N \N \N \N +3 3 3 \N 3 \N 3 \N +4 4 4 \N 4 \N 4 \N +5 5 5 \N 5 \N 5 \N +6 6 6 \N str_6 str_6 \N \N +7 7 7 \N str_7 str_7 \N \N +8 8 8 \N str_8 str_8 \N \N +9 9 9 \N \N \N \N \N +10 10 10 \N \N \N \N \N +11 11 11 \N \N \N \N \N +12 12 12 \N 12 \N 12 \N +13 13 13 \N str_13 str_13 \N \N +14 14 14 \N \N \N \N \N +15 15 15 \N 1970-01-16 \N \N 1970-01-16 +16 16 16 \N 1970-01-17 \N \N 1970-01-17 +17 17 17 \N 1970-01-18 \N \N 1970-01-18 +18 18 18 \N 1970-01-19 \N \N 1970-01-19 +19 19 19 \N \N \N \N \N +20 20 20 \N 20 \N 20 \N +21 21 21 \N str_21 str_21 \N \N +insert after alter modify column 2 +0 0 0 \N \N \N \N \N +1 1 1 \N \N \N \N \N +2 2 2 \N \N \N \N \N +3 3 3 \N 3 \N 3 \N +4 4 4 \N 4 \N 4 \N +5 5 5 \N 5 \N 5 \N +6 6 6 \N str_6 str_6 \N \N +7 7 7 \N str_7 str_7 \N \N +8 8 8 \N str_8 str_8 \N \N +9 9 9 \N \N \N \N \N +10 10 10 \N \N \N \N \N +11 11 11 \N \N \N \N \N +12 12 12 \N 12 \N 12 \N +13 13 13 \N str_13 str_13 \N \N +14 14 14 \N \N \N \N \N +15 15 15 \N 1970-01-16 \N \N 1970-01-16 +16 16 16 \N 1970-01-17 \N \N 1970-01-17 +17 17 17 \N 1970-01-18 \N \N 1970-01-18 +18 18 18 \N 1970-01-19 \N \N 1970-01-19 +19 19 19 \N \N 
\N \N \N +20 20 20 \N 20 \N 20 \N +21 21 21 \N str_21 str_21 \N \N +22 str_22 \N str_22 \N \N \N \N +23 \N \N \N \N \N \N \N +24 24 24 \N \N \N \N \N +MergeTree wide +initial insert +alter add column 1 +0 0 \N \N \N +1 1 \N \N \N +2 2 \N \N \N +insert after alter add column 1 +0 0 \N \N \N +1 1 \N \N \N +2 2 \N \N \N +3 3 3 \N 3 +4 4 4 \N 4 +5 5 5 \N 5 +6 6 str_6 str_6 \N +7 7 str_7 str_7 \N +8 8 str_8 str_8 \N +9 9 \N \N \N +10 10 \N \N \N +11 11 \N \N \N +12 12 12 \N 12 +13 13 str_13 str_13 \N +14 14 \N \N \N +alter modify column 1 +0 0 \N \N \N \N +1 1 \N \N \N \N +2 2 \N \N \N \N +3 3 3 \N 3 \N +4 4 4 \N 4 \N +5 5 5 \N 5 \N +6 6 str_6 str_6 \N \N +7 7 str_7 str_7 \N \N +8 8 str_8 str_8 \N \N +9 9 \N \N \N \N +10 10 \N \N \N \N +11 11 \N \N \N \N +12 12 12 \N 12 \N +13 13 str_13 str_13 \N \N +14 14 \N \N \N \N +insert after alter modify column 1 +0 0 \N \N \N \N +1 1 \N \N \N \N +2 2 \N \N \N \N +3 3 3 \N 3 \N +4 4 4 \N 4 \N +5 5 5 \N 5 \N +6 6 str_6 str_6 \N \N +7 7 str_7 str_7 \N \N +8 8 str_8 str_8 \N \N +9 9 \N \N \N \N +10 10 \N \N \N \N +11 11 \N \N \N \N +12 12 12 \N 12 \N +13 13 str_13 str_13 \N \N +14 14 \N \N \N \N +15 15 1970-01-16 \N \N 1970-01-16 +16 16 1970-01-17 \N \N 1970-01-17 +17 17 1970-01-18 \N \N 1970-01-18 +18 18 1970-01-19 \N \N 1970-01-19 +19 19 \N \N \N \N +20 20 20 \N 20 \N +21 21 str_21 str_21 \N \N +alter modify column 2 +0 0 0 \N \N \N \N \N +1 1 1 \N \N \N \N \N +2 2 2 \N \N \N \N \N +3 3 3 \N 3 \N 3 \N +4 4 4 \N 4 \N 4 \N +5 5 5 \N 5 \N 5 \N +6 6 6 \N str_6 str_6 \N \N +7 7 7 \N str_7 str_7 \N \N +8 8 8 \N str_8 str_8 \N \N +9 9 9 \N \N \N \N \N +10 10 10 \N \N \N \N \N +11 11 11 \N \N \N \N \N +12 12 12 \N 12 \N 12 \N +13 13 13 \N str_13 str_13 \N \N +14 14 14 \N \N \N \N \N +15 15 15 \N 1970-01-16 \N \N 1970-01-16 +16 16 16 \N 1970-01-17 \N \N 1970-01-17 +17 17 17 \N 1970-01-18 \N \N 1970-01-18 +18 18 18 \N 1970-01-19 \N \N 1970-01-19 +19 19 19 \N \N \N \N \N +20 20 20 \N 20 \N 20 \N +21 21 21 \N str_21 str_21 \N \N +insert after alter modify column 2 +0 0 0 \N \N \N \N \N +1 1 1 \N \N \N \N \N +2 2 2 \N \N \N \N \N +3 3 3 \N 3 \N 3 \N +4 4 4 \N 4 \N 4 \N +5 5 5 \N 5 \N 5 \N +6 6 6 \N str_6 str_6 \N \N +7 7 7 \N str_7 str_7 \N \N +8 8 8 \N str_8 str_8 \N \N +9 9 9 \N \N \N \N \N +10 10 10 \N \N \N \N \N +11 11 11 \N \N \N \N \N +12 12 12 \N 12 \N 12 \N +13 13 13 \N str_13 str_13 \N \N +14 14 14 \N \N \N \N \N +15 15 15 \N 1970-01-16 \N \N 1970-01-16 +16 16 16 \N 1970-01-17 \N \N 1970-01-17 +17 17 17 \N 1970-01-18 \N \N 1970-01-18 +18 18 18 \N 1970-01-19 \N \N 1970-01-19 +19 19 19 \N \N \N \N \N +20 20 20 \N 20 \N 20 \N +21 21 21 \N str_21 str_21 \N \N +22 str_22 \N str_22 \N \N \N \N +23 \N \N \N \N \N \N \N +24 24 24 \N \N \N \N \N diff --git a/tests/queries/0_stateless/02941_variant_type_alters.sh b/tests/queries/0_stateless/02941_variant_type_alters.sh new file mode 100755 index 00000000000..9b0d4febd65 --- /dev/null +++ b/tests/queries/0_stateless/02941_variant_type_alters.sh @@ -0,0 +1,61 @@ +#!/usr/bin/env bash +# Tags: long + +CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# reset --log_comment +CLICKHOUSE_LOG_COMMENT= +# shellcheck source=../shell_config.sh +. 
"$CUR_DIR"/../shell_config.sh + +CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1 --use_variant_when_no_common_type_in_if=1 " + +function run() +{ + echo "initial insert" + $CH_CLIENT -q "insert into test select number, number from numbers(3)" + + echo "alter add column 1" + $CH_CLIENT -q "alter table test add column v Variant(UInt64, String) settings mutations_sync=1" + $CH_CLIENT -q "select x, y, v, v.String, v.UInt64 from test order by x" + + echo "insert after alter add column 1" + $CH_CLIENT -q "insert into test select number, number, number from numbers(3, 3)" + $CH_CLIENT -q "insert into test select number, number, 'str_' || toString(number) from numbers(6, 3)" + $CH_CLIENT -q "insert into test select number, number, NULL from numbers(9, 3)" + $CH_CLIENT -q "insert into test select number, number, multiIf(number % 3 == 0, number, number % 3 == 1, 'str_' || toString(number), NULL) from numbers(12, 3)" + $CH_CLIENT -q "select x, y, v, v.String, v.UInt64 from test order by x" + + echo "alter modify column 1" + $CH_CLIENT -q "alter table test modify column v Variant(UInt64, String, Date) settings mutations_sync=1" + $CH_CLIENT -q "select x, y, v, v.String, v.UInt64, v.Date from test order by x" + + echo "insert after alter modify column 1" + $CH_CLIENT -q "insert into test select number, number, toDate(number) from numbers(15, 3)" + $CH_CLIENT -q "insert into test select number, number, multiIf(number % 4 == 0, number, number % 4 == 1, 'str_' || toString(number), number % 4 == 2, toDate(number), NULL) from numbers(18, 4)" + $CH_CLIENT -q "select x, y, v, v.String, v.UInt64, v.Date from test order by x" + + echo "alter modify column 2" + $CH_CLIENT -q "alter table test modify column y Variant(UInt64, String) settings mutations_sync=1" + $CH_CLIENT -q "select x, y, y.UInt64, y.String, v, v.String, v.UInt64, v.Date from test order by x" + + echo "insert after alter modify column 2" + $CH_CLIENT -q "insert into test select number, multiIf(number % 3 == 0, number, number % 3 == 1, 'str_' || toString(number), NULL), NULL from numbers(22, 3)" + $CH_CLIENT -q "select x, y, y.UInt64, y.String, v, v.String, v.UInt64, v.Date from test order by x" +} + +$CH_CLIENT -q "drop table if exists test;" + +echo "Memory" +$CH_CLIENT -q "create table test (x UInt64, y UInt64) engine=Memory" +run +$CH_CLIENT -q "drop table test;" + +echo "MergeTree compact" +$CH_CLIENT -q "create table test (x UInt64, y UInt64) engine=MergeTree order by x settings min_rows_for_wide_part=100000000, min_bytes_for_wide_part=1000000000;" +run +$CH_CLIENT -q "drop table test;" + +echo "MergeTree wide" +$CH_CLIENT -q "create table test (x UInt64, y UInt64 ) engine=MergeTree order by x settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" +run +$CH_CLIENT -q "drop table test;" From 4109b6608186b1b9d9dce60f1821313294b7e7c4 Mon Sep 17 00:00:00 2001 From: avogar Date: Thu, 18 Jan 2024 17:30:32 +0000 Subject: [PATCH 0169/1081] Remove unneded tag from test --- tests/queries/0_stateless/02941_variant_type_alters.sh | 1 - 1 file changed, 1 deletion(-) diff --git a/tests/queries/0_stateless/02941_variant_type_alters.sh b/tests/queries/0_stateless/02941_variant_type_alters.sh index 9b0d4febd65..7e2ecbd67aa 100755 --- a/tests/queries/0_stateless/02941_variant_type_alters.sh +++ b/tests/queries/0_stateless/02941_variant_type_alters.sh @@ -1,5 +1,4 @@ #!/usr/bin/env bash -# Tags: long CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # reset --log_comment From f1749217ee41b3b721fb8a185a929eb18db89b2f Mon Sep 17 
00:00:00 2001 From: Blargian Date: Thu, 18 Jan 2024 21:53:56 +0200 Subject: [PATCH 0170/1081] added format_schema_rows_template setting --- docs/en/operations/settings/settings-formats.md | 4 ++++ src/Core/Settings.h | 1 + src/Formats/FormatFactory.cpp | 1 + src/Formats/FormatSettings.h | 1 + 4 files changed, 7 insertions(+) diff --git a/docs/en/operations/settings/settings-formats.md b/docs/en/operations/settings/settings-formats.md index eb09af44efd..5dedaa2f6ab 100644 --- a/docs/en/operations/settings/settings-formats.md +++ b/docs/en/operations/settings/settings-formats.md @@ -1668,6 +1668,10 @@ Path to file which contains format string for rows (for Template format). Delimiter between rows (for Template format). +### format_schema_rows_template {#format_schema_rows_template} + +Format string for rows (for Template format) + ## CustomSeparated format settings {custom-separated-format-settings} ### format_custom_escaping_rule {#format_custom_escaping_rule} diff --git a/src/Core/Settings.h b/src/Core/Settings.h index 292e945a29c..4de739ec405 100644 --- a/src/Core/Settings.h +++ b/src/Core/Settings.h @@ -1079,6 +1079,7 @@ class IColumn; M(String, format_template_resultset, "", "Path to file which contains format string for result set (for Template format)", 0) \ M(String, format_template_row, "", "Path to file which contains format string for rows (for Template format)", 0) \ M(String, format_template_rows_between_delimiter, "\n", "Delimiter between rows (for Template format)", 0) \ + M(String, format_schema_rows_template, "\n", "Format string for rows (for Template format)", 0) \ \ M(EscapingRule, format_custom_escaping_rule, "Escaped", "Field escaping rule (for CustomSeparated format)", 0) \ M(String, format_custom_field_delimiter, "\t", "Delimiter between fields (for CustomSeparated format)", 0) \ diff --git a/src/Formats/FormatFactory.cpp b/src/Formats/FormatFactory.cpp index 608f9433d6f..6f414c5a69f 100644 --- a/src/Formats/FormatFactory.cpp +++ b/src/Formats/FormatFactory.cpp @@ -166,6 +166,7 @@ FormatSettings getFormatSettings(ContextPtr context, const Settings & settings) format_settings.template_settings.resultset_format = settings.format_template_resultset; format_settings.template_settings.row_between_delimiter = settings.format_template_rows_between_delimiter; format_settings.template_settings.row_format = settings.format_template_row; + format_settings.template_settings.row_format_schema_string = settings.format_schema_rows_template; format_settings.tsv.crlf_end_of_line = settings.output_format_tsv_crlf_end_of_line; format_settings.tsv.empty_as_default = settings.input_format_tsv_empty_as_default; format_settings.tsv.enum_as_number = settings.input_format_tsv_enum_as_number; diff --git a/src/Formats/FormatSettings.h b/src/Formats/FormatSettings.h index 30e4dd04513..70d33a1edcd 100644 --- a/src/Formats/FormatSettings.h +++ b/src/Formats/FormatSettings.h @@ -338,6 +338,7 @@ struct FormatSettings String resultset_format; String row_format; String row_between_delimiter; + String row_format_schema_string; } template_settings; struct From 3dcc2056a59f9b374b4de3b72c30107dd7825d47 Mon Sep 17 00:00:00 2001 From: avogar Date: Thu, 18 Jan 2024 20:39:36 +0000 Subject: [PATCH 0171/1081] Fix conflicts --- src/DataTypes/Serializations/ISerialization.cpp | 1 + src/DataTypes/Serializations/ISerialization.h | 1 + src/DataTypes/Serializations/SerializationVariant.cpp | 2 +- 3 files changed, 3 insertions(+), 1 deletion(-) diff --git a/src/DataTypes/Serializations/ISerialization.cpp 
b/src/DataTypes/Serializations/ISerialization.cpp index 2f1eb1887af..7d57d72090b 100644 --- a/src/DataTypes/Serializations/ISerialization.cpp +++ b/src/DataTypes/Serializations/ISerialization.cpp @@ -54,6 +54,7 @@ const std::set ISerialization::Substream::named_types TupleElement, NamedOffsets, NamedNullMap, + NamedVariantDiscriminators, }; String ISerialization::Substream::toString() const diff --git a/src/DataTypes/Serializations/ISerialization.h b/src/DataTypes/Serializations/ISerialization.h index 64a7a889640..7fba9db4acf 100644 --- a/src/DataTypes/Serializations/ISerialization.h +++ b/src/DataTypes/Serializations/ISerialization.h @@ -155,6 +155,7 @@ public: ObjectData, VariantDiscriminators, + NamedVariantDiscriminators, VariantOffsets, VariantElements, VariantElement, diff --git a/src/DataTypes/Serializations/SerializationVariant.cpp b/src/DataTypes/Serializations/SerializationVariant.cpp index 48a78dd54a9..5af94364167 100644 --- a/src/DataTypes/Serializations/SerializationVariant.cpp +++ b/src/DataTypes/Serializations/SerializationVariant.cpp @@ -36,7 +36,7 @@ void SerializationVariant::enumerateStreams( const auto * type_variant = data.type ? &assert_cast(*data.type) : nullptr; const auto * column_variant = data.column ? &assert_cast(*data.column) : nullptr; - auto discriminators_serialization = std::make_shared(std::make_shared>(), "discr", false); + auto discriminators_serialization = std::make_shared(std::make_shared>(), "discr", SubstreamType::NamedVariantDiscriminators); auto local_discriminators = column_variant ? column_variant->getLocalDiscriminatorsPtr() : nullptr; settings.path.push_back(Substream::VariantDiscriminators); From cfc8c60aa70917e48281e3583adc922967326d50 Mon Sep 17 00:00:00 2001 From: avogar Date: Thu, 18 Jan 2024 21:26:55 +0000 Subject: [PATCH 0172/1081] Fix build --- src/DataTypes/Serializations/SerializationVariantElement.cpp | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/DataTypes/Serializations/SerializationVariantElement.cpp b/src/DataTypes/Serializations/SerializationVariantElement.cpp index 80524cbd814..8d0acee1c2b 100644 --- a/src/DataTypes/Serializations/SerializationVariantElement.cpp +++ b/src/DataTypes/Serializations/SerializationVariantElement.cpp @@ -208,8 +208,8 @@ void SerializationVariantElement::removeVariantFromPath(DB::ISerialization::Subs } SerializationVariantElement::VariantSubcolumnCreator::VariantSubcolumnCreator( - const DB::ColumnPtr & local_discriminators_, - const DB::String & variant_element_name_, + const ColumnPtr & local_discriminators_, + const String & variant_element_name_, const ColumnVariant::Discriminator global_variant_discriminator_, const ColumnVariant::Discriminator local_variant_discriminator_) : local_discriminators(local_discriminators_) From c966674c242552584540dc2e28026894c39f9b16 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Fri, 19 Jan 2024 03:59:05 +0100 Subject: [PATCH 0173/1081] Disable LTO with Coverage --- CMakeLists.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/CMakeLists.txt b/CMakeLists.txt index 063cfc77302..6e984ddd864 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -348,7 +348,7 @@ if (COMPILER_CLANG) set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -fdiagnostics-absolute-paths") set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -fdiagnostics-absolute-paths") - if (NOT ENABLE_TESTS AND NOT SANITIZE AND OS_LINUX) + if (NOT ENABLE_TESTS AND NOT SANITIZE AND NOT SANITIZE_COVERAGE AND OS_LINUX) # https://clang.llvm.org/docs/ThinLTO.html # Applies to clang and 
linux only. # Disabled when building with tests or sanitizers. From c6afbe522cae20ee6041534bf7ee7e31e3acb51c Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Fri, 19 Jan 2024 05:26:14 +0100 Subject: [PATCH 0174/1081] Do not check for large translation units with coverage --- CMakeLists.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/CMakeLists.txt b/CMakeLists.txt index 6e984ddd864..d0f44f6f3ad 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -546,7 +546,7 @@ if (ENABLE_RUST) endif() endif() -if (CMAKE_BUILD_TYPE_UC STREQUAL "RELWITHDEBINFO" AND NOT SANITIZE AND OS_LINUX AND (ARCH_AMD64 OR ARCH_AARCH64)) +if (CMAKE_BUILD_TYPE_UC STREQUAL "RELWITHDEBINFO" AND NOT SANITIZE AND NOT SANITIZE_COVERAGE AND OS_LINUX AND (ARCH_AMD64 OR ARCH_AARCH64)) set(CHECK_LARGE_OBJECT_SIZES_DEFAULT ON) else () set(CHECK_LARGE_OBJECT_SIZES_DEFAULT OFF) From 482229cd27c7ddf4218af2ea5d9b087e51876ab0 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Fri, 19 Jan 2024 08:04:34 +0100 Subject: [PATCH 0175/1081] Add tests with coverage --- .github/workflows/master.yml | 16 ++++++++++++++++ .github/workflows/pull_request.yml | 16 ++++++++++++++++ 2 files changed, 32 insertions(+) diff --git a/.github/workflows/master.yml b/.github/workflows/master.yml index 1920f3a2a56..5f683fa6c59 100644 --- a/.github/workflows/master.yml +++ b/.github/workflows/master.yml @@ -371,6 +371,14 @@ jobs: test_name: Stateless tests (release) runner_type: func-tester data: ${{ needs.RunConfig.outputs.data }} + FunctionalStatelessTestCoverage: + needs: [RunConfig, BuilderDebReleaseCoverage] + if: ${{ !failure() && !cancelled() }} + uses: ./.github/workflows/reusable_test.yml + with: + test_name: Stateless tests (coverage) + runner_type: func-tester + data: ${{ needs.RunConfig.outputs.data }} FunctionalStatelessTestReleaseDatabaseOrdinary: needs: [RunConfig, BuilderDebRelease] if: ${{ !failure() && !cancelled() }} @@ -463,6 +471,14 @@ jobs: test_name: Stateful tests (release) runner_type: func-tester data: ${{ needs.RunConfig.outputs.data }} + FunctionalStatefulTestCoverage: + needs: [RunConfig, BuilderDebReleaseCoverage] + if: ${{ !failure() && !cancelled() }} + uses: ./.github/workflows/reusable_test.yml + with: + test_name: Stateful tests (coverage) + runner_type: func-tester + data: ${{ needs.RunConfig.outputs.data }} FunctionalStatefulTestAarch64: needs: [RunConfig, BuilderDebAarch64] if: ${{ !failure() && !cancelled() }} diff --git a/.github/workflows/pull_request.yml b/.github/workflows/pull_request.yml index 28617695ad5..235c8042657 100644 --- a/.github/workflows/pull_request.yml +++ b/.github/workflows/pull_request.yml @@ -382,6 +382,14 @@ jobs: test_name: Stateless tests (release) runner_type: func-tester data: ${{ needs.RunConfig.outputs.data }} + FunctionalStatelessTestCoverage: + needs: [RunConfig, BuilderDebReleaseCoverage] + if: ${{ !failure() && !cancelled() }} + uses: ./.github/workflows/reusable_test.yml + with: + test_name: Stateless tests (coverage) + runner_type: func-tester + data: ${{ needs.RunConfig.outputs.data }} FunctionalStatelessTestReleaseDatabaseReplicated: needs: [RunConfig, BuilderDebRelease] if: ${{ !failure() && !cancelled() }} @@ -509,6 +517,14 @@ jobs: test_name: Stateful tests (release) runner_type: func-tester data: ${{ needs.RunConfig.outputs.data }} + FunctionalStatefulTestCoverage: + needs: [RunConfig, BuilderDebReleaseCoverage] + if: ${{ !failure() && !cancelled() }} + uses: ./.github/workflows/reusable_test.yml + with: + test_name: Stateful tests (coverage) + 
runner_type: func-tester + data: ${{ needs.RunConfig.outputs.data }} FunctionalStatefulTestAarch64: needs: [RunConfig, BuilderDebAarch64] if: ${{ !failure() && !cancelled() }} From 7ae631de1ed1ff4bcb8bac5e06c2026db3ff972c Mon Sep 17 00:00:00 2001 From: avogar Date: Fri, 19 Jan 2024 10:23:40 +0000 Subject: [PATCH 0176/1081] Remove wron check, remove duplicate tests --- .../SerializationVariantElement.cpp | 4 -- ...> 02943_variant_read_subcolumns.reference} | 0 ..._1.sh => 02943_variant_read_subcolumns.sh} | 0 .../02943_variant_read_subcolumns_2.reference | 6 --- .../02943_variant_read_subcolumns_2.sh | 38 ------------------- 5 files changed, 48 deletions(-) rename tests/queries/0_stateless/{02943_variant_read_subcolumns_1.reference => 02943_variant_read_subcolumns.reference} (100%) rename tests/queries/0_stateless/{02943_variant_read_subcolumns_1.sh => 02943_variant_read_subcolumns.sh} (100%) delete mode 100644 tests/queries/0_stateless/02943_variant_read_subcolumns_2.reference delete mode 100755 tests/queries/0_stateless/02943_variant_read_subcolumns_2.sh diff --git a/src/DataTypes/Serializations/SerializationVariantElement.cpp b/src/DataTypes/Serializations/SerializationVariantElement.cpp index 8d0acee1c2b..56f0e5d77be 100644 --- a/src/DataTypes/Serializations/SerializationVariantElement.cpp +++ b/src/DataTypes/Serializations/SerializationVariantElement.cpp @@ -156,7 +156,6 @@ void SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams( return; } - size_t prev_variant_size = variant_element_state->variant->size(); addVariantToPath(settings.path); nested_serialization->deserializeBinaryBulkWithMultipleStreams(variant_element_state->variant, variant_limit, settings, variant_element_state->variant_element_state, cache); removeVariantFromPath(settings.path); @@ -171,9 +170,6 @@ void SerializationVariantElement::deserializeBinaryBulkWithMultipleStreams( return; } - if (variant_element_state->variant->size() != prev_variant_size + variant_limit) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Unexpected variant column size after deserialization. Expected {}, got {}", prev_variant_size + variant_limit, variant_element_state->variant->size()); - size_t variant_offset = variant_element_state->variant->size() - variant_limit; /// If we have only our discriminator in range, insert the whole range to result column. 
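For context on the Variant subcolumn reads this serialization path serves, a minimal illustrative sketch (not part of the patch), assuming a table named test with a column v Variant(UInt64, String) as in the stateless tests elsewhere in this series:

    SET allow_experimental_variant_type = 1;
    CREATE TABLE test (id UInt64, v Variant(UInt64, String)) ENGINE = MergeTree ORDER BY id;
    INSERT INTO test VALUES (1, 42), (2, 'str_2'), (3, NULL);
    -- Each requested subcolumn is deserialized through SerializationVariantElement;
    -- rows that hold a different variant come back as NULL for that subcolumn.
    SELECT v, v.UInt64, v.String FROM test ORDER BY id;

The renames and deletions below consolidate the duplicated read-subcolumns tests into a single 02943_variant_read_subcolumns test.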
diff --git a/tests/queries/0_stateless/02943_variant_read_subcolumns_1.reference b/tests/queries/0_stateless/02943_variant_read_subcolumns.reference similarity index 100% rename from tests/queries/0_stateless/02943_variant_read_subcolumns_1.reference rename to tests/queries/0_stateless/02943_variant_read_subcolumns.reference diff --git a/tests/queries/0_stateless/02943_variant_read_subcolumns_1.sh b/tests/queries/0_stateless/02943_variant_read_subcolumns.sh similarity index 100% rename from tests/queries/0_stateless/02943_variant_read_subcolumns_1.sh rename to tests/queries/0_stateless/02943_variant_read_subcolumns.sh diff --git a/tests/queries/0_stateless/02943_variant_read_subcolumns_2.reference b/tests/queries/0_stateless/02943_variant_read_subcolumns_2.reference deleted file mode 100644 index 4b93782cddf..00000000000 --- a/tests/queries/0_stateless/02943_variant_read_subcolumns_2.reference +++ /dev/null @@ -1,6 +0,0 @@ -Memory -test -MergeTree compact -test -MergeTree wide -test diff --git a/tests/queries/0_stateless/02943_variant_read_subcolumns_2.sh b/tests/queries/0_stateless/02943_variant_read_subcolumns_2.sh deleted file mode 100755 index 9ccad55191f..00000000000 --- a/tests/queries/0_stateless/02943_variant_read_subcolumns_2.sh +++ /dev/null @@ -1,38 +0,0 @@ -#!/usr/bin/env bash -# Tags: long - -CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) -# reset --log_comment -CLICKHOUSE_LOG_COMMENT= -# shellcheck source=../shell_config.sh -. "$CUR_DIR"/../shell_config.sh - -CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1 --use_variant_when_no_common_type_in_if=1 " - - -function test() -{ - echo "test" - $CH_CLIENT -q "insert into test select number, multiIf(number % 3 == 2, NULL, number % 3 == 1, number, arrayMap(x -> multiIf(number % 9 == 0, NULL, number % 9 == 3, 'str_' || toString(number), number), range(number % 10))) from numbers(1000000) settings min_insert_block_size_rows=100000" - $CH_CLIENT -q "select v, v.UInt64, v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64 from test order by id format Null" - $CH_CLIENT -q "select v.UInt64, v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64 from test order by id format Null" - $CH_CLIENT -q "select v.\`Array(Variant(String, UInt64))\`, v.\`Array(Variant(String, UInt64))\`.size0, v.\`Array(Variant(String, UInt64))\`.UInt64, v.\`Array(Variant(String, UInt64))\`.String from test order by id format Null" -} - -$CH_CLIENT -q "drop table if exists test;" - -echo "Memory" -$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=Memory" -test -$CH_CLIENT -q "drop table test;" - -echo "MergeTree compact" -$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=MergeTree order by id settings min_rows_for_wide_part=1000000000, min_bytes_for_wide_part=10000000000;" -test -$CH_CLIENT -q "drop table test;" - -echo "MergeTree wide" -$CH_CLIENT -q "create table test (id UInt64, v Variant(UInt64, Array(Variant(String, UInt64)))) engine=MergeTree order by id settings min_rows_for_wide_part=1, min_bytes_for_wide_part=1;" -test -$CH_CLIENT -q "drop table test;" - From 0c85339ddb26e00ac64d6c763a0f5019b7ee2619 Mon Sep 17 00:00:00 2001 From: avogar Date: Fri, 19 Jan 2024 10:50:13 +0000 Subject: [PATCH 0177/1081] Fix style --- src/DataTypes/Serializations/SerializationVariantElement.cpp | 1 - 1 file 
changed, 1 deletion(-) diff --git a/src/DataTypes/Serializations/SerializationVariantElement.cpp b/src/DataTypes/Serializations/SerializationVariantElement.cpp index 56f0e5d77be..053f8d22d5a 100644 --- a/src/DataTypes/Serializations/SerializationVariantElement.cpp +++ b/src/DataTypes/Serializations/SerializationVariantElement.cpp @@ -9,7 +9,6 @@ namespace DB namespace ErrorCodes { extern const int NOT_IMPLEMENTED; - extern const int LOGICAL_ERROR; } void SerializationVariantElement::enumerateStreams( From a196d04a1c2d5f36ec43c2b0947916be7321037c Mon Sep 17 00:00:00 2001 From: kssenii Date: Fri, 19 Jan 2024 12:04:16 +0100 Subject: [PATCH 0178/1081] Update test --- .../test_broken_projections/test.py | 94 +++++++++++++++++-- 1 file changed, 84 insertions(+), 10 deletions(-) diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py index 1b192e0df24..48ed10d0f87 100644 --- a/tests/integration/test_broken_projections/test.py +++ b/tests/integration/test_broken_projections/test.py @@ -159,6 +159,19 @@ def get_broken_projections_info(node, table): ).strip() +def get_projections_info(node, table): + return node.query( + f""" + SELECT parent_name, name, is_broken + FROM system.projection_parts + WHERE table='{table}' + AND active = 1 + AND database=currentDatabase() + ORDER BY parent_name, name + """ + ).strip() + + def optimize(node, table, final, no_wait): query = f"OPTIMIZE TABLE {table}" if final: @@ -389,6 +402,11 @@ def test_broken_ignored_replicated(cluster): assert "has a broken projection" not in check_table_full(node, table_name) +def get_random_string(string_length=8): + alphabet = string.ascii_letters + string.digits + return "".join((random.choice(alphabet) for _ in range(string_length))) + + def test_broken_projections_in_backups(cluster): node = cluster.instances["node"] @@ -400,6 +418,10 @@ def test_broken_projections_in_backups(cluster): insert(node, table_name, 10, 5) insert(node, table_name, 15, 5) + assert ["all_0_0_0", "all_1_1_0", "all_2_2_0", "all_3_3_0"] == get_parts( + node, table_name + ) + check(node, table_name, 1) break_projection(node, table_name, "proj", "all_2_2_0", "data") @@ -409,10 +431,23 @@ def test_broken_projections_in_backups(cluster): node, table_name ) + assert ( + "all_0_0_0\tproj\t0\n" + "all_0_0_0\tproj_2\t0\n" + "all_1_1_0\tproj\t0\n" + "all_1_1_0\tproj_2\t0\n" + "all_2_2_0\tproj\t1\n" + "all_2_2_0\tproj_2\t0\n" + "all_3_3_0\tproj\t0\n" + "all_3_3_0\tproj_2\t0" + == get_projections_info(node, table_name) + ) + + backup_name = f"b1-{get_random_string()}" assert "BACKUP_CREATED" in node.query( f""" set backup_restore_keeper_fault_injection_probability=0.0; - backup table {table_name} to Disk('backups', 'b1') settings check_projection_parts=false; + backup table {table_name} to Disk('backups', '{backup_name}') settings check_projection_parts=false; """ ) @@ -420,18 +455,30 @@ def test_broken_projections_in_backups(cluster): f""" drop table {table_name} sync; set backup_restore_keeper_fault_injection_probability=0.0; - restore table {table_name} from Disk('backups', 'b1'); + restore table {table_name} from Disk('backups', '{backup_name}'); """ ) + assert ( + "all_0_0_0\tproj\t0\n" + "all_0_0_0\tproj_2\t0\n" + "all_1_1_0\tproj\t0\n" + "all_1_1_0\tproj_2\t0\n" + "all_2_2_0\tproj\t0\n" + "all_2_2_0\tproj_2\t0\n" + "all_3_3_0\tproj\t0\n" + "all_3_3_0\tproj_2\t0" + == get_projections_info(node, table_name) + ) + check(node, table_name, 1) assert "" == get_broken_projections_info(node, table_name) - 
break_projection(node, table_name, "proj", "all_2_2_0", "part") + break_projection(node, table_name, "proj_2", "all_2_2_0", "part") - check(node, table_name, 0, "proj", "ErrnoException") + check(node, table_name, 0, "proj_2", "ErrnoException") - assert "all_2_2_0\tproj\tFILE_DOESNT_EXIST" == get_broken_projections_info( + assert "all_2_2_0\tproj_2\tFILE_DOESNT_EXIST" == get_broken_projections_info( node, table_name ) @@ -442,13 +489,14 @@ def test_broken_projections_in_backups(cluster): """ ) - materialize_projection(node, table_name, "proj") + materialize_projection(node, table_name, "proj_2") check(node, table_name, 1) + backup_name = f"b3-{get_random_string()}" assert "BACKUP_CREATED" in node.query( f""" set backup_restore_keeper_fault_injection_probability=0.0; - backup table {table_name} to Disk('backups', 'b3') settings check_projection_parts=false; + backup table {table_name} to Disk('backups', '{backup_name}') settings check_projection_parts=false; """ ) @@ -456,11 +504,23 @@ def test_broken_projections_in_backups(cluster): f""" drop table {table_name} sync; set backup_restore_keeper_fault_injection_probability=0.0; - restore table {table_name} from Disk('backups', 'b3'); + restore table {table_name} from Disk('backups', '{backup_name}'); """ ) check(node, table_name, 1) + assert ( + "all_0_0_0\tproj\t0\n" + "all_0_0_0\tproj_2\t0\n" + "all_1_1_0\tproj\t0\n" + "all_1_1_0\tproj_2\t0\n" + "all_2_2_0\tproj\t0\n" + "all_2_2_0\tproj_2\t0\n" + "all_3_3_0\tproj\t0\n" + "all_3_3_0\tproj_2\t0" + == get_projections_info(node, table_name) + ) + break_projection(node, table_name, "proj", "all_1_1_0", "part") assert "Part all_1_1_0 has a broken projection proj" in check_table_full( node, table_name @@ -469,10 +529,11 @@ def test_broken_projections_in_backups(cluster): node, table_name ) + backup_name = f"b4-{get_random_string()}" assert "BACKUP_CREATED" in node.query( f""" set backup_restore_keeper_fault_injection_probability=0.0; - backup table {table_name} to Disk('backups', 'b4') settings check_projection_parts=false, allow_backup_broken_projections=true; + backup table {table_name} to Disk('backups', '{backup_name}') settings check_projection_parts=false, allow_backup_broken_projections=true; """ ) @@ -480,9 +541,22 @@ def test_broken_projections_in_backups(cluster): f""" drop table {table_name} sync; set backup_restore_keeper_fault_injection_probability=0.0; - restore table {table_name} from Disk('backups', 'b4'); + restore table {table_name} from Disk('backups', '{backup_name}'); """ ) + + assert ( + "all_0_0_0\tproj\t0\n" + "all_0_0_0\tproj_2\t0\n" + "all_1_1_0\tproj\t1\n" + "all_1_1_0\tproj_2\t0\n" + "all_2_2_0\tproj\t0\n" + "all_2_2_0\tproj_2\t0\n" + "all_3_3_0\tproj\t0\n" + "all_3_3_0\tproj_2\t0" + == get_projections_info(node, table_name) + ) + check(node, table_name, 0) assert "all_1_1_0\tproj\tNO_FILE_IN_DATA_PART" == get_broken_projections_info( node, table_name From 580501c2b42231eacc4e843968aeb876ff784297 Mon Sep 17 00:00:00 2001 From: avogar Date: Fri, 19 Jan 2024 11:08:56 +0000 Subject: [PATCH 0179/1081] Add new settings to settings changes history --- src/Core/SettingsChangesHistory.h | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/src/Core/SettingsChangesHistory.h b/src/Core/SettingsChangesHistory.h index 62ffd837a33..af213983b66 100644 --- a/src/Core/SettingsChangesHistory.h +++ b/src/Core/SettingsChangesHistory.h @@ -83,7 +83,9 @@ static std::map sett { {"24.1", {{"print_pretty_type_names", false, true, "Better user experience."}, 
{"input_format_json_read_bools_as_strings", false, true, "Allow to read bools as strings in JSON formats by default"}, - {"output_format_arrow_use_signed_indexes_for_dictionary", false, true, "Use signed indexes type for Arrow dictionaries by default as it's recommended"}}}, + {"output_format_arrow_use_signed_indexes_for_dictionary", false, true, "Use signed indexes type for Arrow dictionaries by default as it's recommended"}, + {"allow_experimental_variant_type", false, false, "Add new experimental Variant type"}, + {"use_variant_when_no_common_type_in_if", false, false, "Allow to use Variant in if/multiIf if there is no common type"}}}, {"23.12", {{"allow_suspicious_ttl_expressions", true, false, "It is a new setting, and in previous versions the behavior was equivalent to allowing."}, {"input_format_parquet_allow_missing_columns", false, true, "Allow missing columns in Parquet files by default"}, {"input_format_orc_allow_missing_columns", false, true, "Allow missing columns in ORC files by default"}, From 7c66141e08ec203dbff908d69d929ea3bfc0995f Mon Sep 17 00:00:00 2001 From: robot-clickhouse Date: Fri, 19 Jan 2024 11:11:13 +0000 Subject: [PATCH 0180/1081] Automatic style fix --- tests/integration/test_broken_projections/test.py | 12 ++++-------- 1 file changed, 4 insertions(+), 8 deletions(-) diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py index 48ed10d0f87..8e3978a078e 100644 --- a/tests/integration/test_broken_projections/test.py +++ b/tests/integration/test_broken_projections/test.py @@ -439,8 +439,7 @@ def test_broken_projections_in_backups(cluster): "all_2_2_0\tproj\t1\n" "all_2_2_0\tproj_2\t0\n" "all_3_3_0\tproj\t0\n" - "all_3_3_0\tproj_2\t0" - == get_projections_info(node, table_name) + "all_3_3_0\tproj_2\t0" == get_projections_info(node, table_name) ) backup_name = f"b1-{get_random_string()}" @@ -467,8 +466,7 @@ def test_broken_projections_in_backups(cluster): "all_2_2_0\tproj\t0\n" "all_2_2_0\tproj_2\t0\n" "all_3_3_0\tproj\t0\n" - "all_3_3_0\tproj_2\t0" - == get_projections_info(node, table_name) + "all_3_3_0\tproj_2\t0" == get_projections_info(node, table_name) ) check(node, table_name, 1) @@ -517,8 +515,7 @@ def test_broken_projections_in_backups(cluster): "all_2_2_0\tproj\t0\n" "all_2_2_0\tproj_2\t0\n" "all_3_3_0\tproj\t0\n" - "all_3_3_0\tproj_2\t0" - == get_projections_info(node, table_name) + "all_3_3_0\tproj_2\t0" == get_projections_info(node, table_name) ) break_projection(node, table_name, "proj", "all_1_1_0", "part") @@ -553,8 +550,7 @@ def test_broken_projections_in_backups(cluster): "all_2_2_0\tproj\t0\n" "all_2_2_0\tproj_2\t0\n" "all_3_3_0\tproj\t0\n" - "all_3_3_0\tproj_2\t0" - == get_projections_info(node, table_name) + "all_3_3_0\tproj_2\t0" == get_projections_info(node, table_name) ) check(node, table_name, 0) From c51d1f04f6d135c63f5123d4aaef47cef5474525 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Fri, 19 Jan 2024 15:57:20 +0100 Subject: [PATCH 0181/1081] Add settings max_unexpected_write_error_retries for Azure Blob Storage --- src/Core/Settings.h | 1 + src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp | 10 +++++----- src/Disks/IO/WriteBufferFromAzureBlobStorage.h | 2 ++ .../AzureBlobStorage/AzureBlobStorageAuth.cpp | 3 ++- .../AzureBlobStorage/AzureObjectStorage.cpp | 1 + .../AzureBlobStorage/AzureObjectStorage.h | 5 ++++- 6 files changed, 15 insertions(+), 7 deletions(-) diff --git a/src/Core/Settings.h b/src/Core/Settings.h index 292e945a29c..59f32c60f63 100644 --- 
a/src/Core/Settings.h +++ b/src/Core/Settings.h @@ -86,6 +86,7 @@ class IColumn; M(UInt64, azure_max_single_part_upload_size, 100*1024*1024, "The maximum size of object to upload using singlepart upload to Azure blob storage.", 0) \ M(UInt64, s3_max_single_read_retries, 4, "The maximum number of retries during single S3 read.", 0) \ M(UInt64, azure_max_single_read_retries, 4, "The maximum number of retries during single Azure blob storage read.", 0) \ + M(UInt64, azure_max_unexpected_write_error_retries, 4, "The maximum number of retries in case of unexpected errors during Azure blob storage write", 0) \ M(UInt64, s3_max_unexpected_write_error_retries, 4, "The maximum number of retries in case of unexpected errors during S3 write.", 0) \ M(UInt64, s3_max_redirects, 10, "Max number of S3 redirects hops allowed.", 0) \ M(UInt64, s3_max_connections, 1024, "The maximum number of connections per server.", 0) \ diff --git a/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp b/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp index 60bc04f5f95..b4665eb7346 100644 --- a/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp +++ b/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp @@ -18,17 +18,17 @@ namespace ProfileEvents namespace DB { -static constexpr auto DEFAULT_RETRY_NUM = 3; - WriteBufferFromAzureBlobStorage::WriteBufferFromAzureBlobStorage( std::shared_ptr blob_container_client_, const String & blob_path_, size_t max_single_part_upload_size_, + size_t max_unexpected_write_error_retries_, size_t buf_size_, const WriteSettings & write_settings_) : WriteBufferFromFileBase(buf_size_, nullptr, 0) , log(&Poco::Logger::get("WriteBufferFromAzureBlobStorage")) , max_single_part_upload_size(max_single_part_upload_size_) + , max_unexpected_write_error_retries(max_unexpected_write_error_retries_) , blob_path(blob_path_) , write_settings(write_settings_) , blob_container_client(blob_container_client_) @@ -77,13 +77,13 @@ void WriteBufferFromAzureBlobStorage::execWithRetry(std::function func, void WriteBufferFromAzureBlobStorage::finalizeImpl() { - execWithRetry([this](){ next(); }, DEFAULT_RETRY_NUM); + execWithRetry([this](){ next(); }, max_unexpected_write_error_retries); if (tmp_buffer_write_offset > 0) uploadBlock(tmp_buffer->data(), tmp_buffer_write_offset); auto block_blob_client = blob_container_client->GetBlockBlobClient(blob_path); - execWithRetry([&](){ block_blob_client.CommitBlockList(block_ids); }, DEFAULT_RETRY_NUM); + execWithRetry([&](){ block_blob_client.CommitBlockList(block_ids); }, max_unexpected_write_error_retries); LOG_TRACE(log, "Committed {} blocks for blob `{}`", block_ids.size(), blob_path); } @@ -94,7 +94,7 @@ void WriteBufferFromAzureBlobStorage::uploadBlock(const char * data, size_t size const std::string & block_id = block_ids.emplace_back(getRandomASCIIString(64)); Azure::Core::IO::MemoryBodyStream memory_stream(reinterpret_cast(data), size); - execWithRetry([&](){ block_blob_client.StageBlock(block_id, memory_stream); }, DEFAULT_RETRY_NUM, size); + execWithRetry([&](){ block_blob_client.StageBlock(block_id, memory_stream); }, max_unexpected_write_error_retries, size); tmp_buffer_write_offset = 0; LOG_TRACE(log, "Staged block (id: {}) of size {} (blob path: {}).", block_id, size, blob_path); diff --git a/src/Disks/IO/WriteBufferFromAzureBlobStorage.h b/src/Disks/IO/WriteBufferFromAzureBlobStorage.h index f1be81922e1..7494130134b 100644 --- a/src/Disks/IO/WriteBufferFromAzureBlobStorage.h +++ b/src/Disks/IO/WriteBufferFromAzureBlobStorage.h @@ -30,6 +30,7 @@ public: AzureClientPtr 
blob_container_client_, const String & blob_path_, size_t max_single_part_upload_size_, + size_t max_unexpected_write_error_retries_, size_t buf_size_, const WriteSettings & write_settings_); @@ -48,6 +49,7 @@ private: Poco::Logger * log; const size_t max_single_part_upload_size; + const size_t max_unexpected_write_error_retries; const std::string blob_path; const WriteSettings write_settings; diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp b/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp index a5c8afe0264..a209049ceee 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp @@ -164,7 +164,8 @@ std::unique_ptr getAzureBlobStorageSettings(const Po config.getUInt64(config_prefix + ".min_bytes_for_seek", 1024 * 1024), config.getInt(config_prefix + ".max_single_read_retries", 3), config.getInt(config_prefix + ".max_single_download_retries", 3), - config.getInt(config_prefix + ".list_object_keys_size", 1000) + config.getInt(config_prefix + ".list_object_keys_size", 1000), + config.getUInt64(config_prefix + ".max_unexpected_write_error_retries", 4) ); } diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp index 068e2aebab1..683bfeb74a7 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp @@ -268,6 +268,7 @@ std::unique_ptr AzureObjectStorage::writeObject( /// NO client.get(), object.remote_path, settings.get()->max_single_part_upload_size, + settings.get()->max_unexpected_write_error_retries, buf_size, patchSettings(write_settings)); } diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h index 4718dce9bf9..2d505c6a022 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h @@ -23,12 +23,14 @@ struct AzureObjectStorageSettings uint64_t min_bytes_for_seek_, int max_single_read_retries_, int max_single_download_retries_, - int list_object_keys_size_) + int list_object_keys_size_, + size_t max_unexpected_write_error_retries_) : max_single_part_upload_size(max_single_part_upload_size_) , min_bytes_for_seek(min_bytes_for_seek_) , max_single_read_retries(max_single_read_retries_) , max_single_download_retries(max_single_download_retries_) , list_object_keys_size(list_object_keys_size_) + , max_unexpected_write_error_retries (max_unexpected_write_error_retries_) { } @@ -39,6 +41,7 @@ struct AzureObjectStorageSettings size_t max_single_read_retries = 3; size_t max_single_download_retries = 3; int list_object_keys_size = 1000; + size_t max_unexpected_write_error_retries = 4; }; using AzureClient = Azure::Storage::Blobs::BlobContainerClient; From d22fc3a224ac29857f3dc3eb60ff872221829006 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Fri, 19 Jan 2024 16:13:58 +0100 Subject: [PATCH 0182/1081] Updated to fetch default from settings --- .../ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp b/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp index a209049ceee..e0199fde98b 100644 --- 
a/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp @@ -7,6 +7,7 @@ #include #include #include +#include using namespace Azure::Storage::Blobs; @@ -157,7 +158,7 @@ std::unique_ptr getAzureBlobContainerClient( } } -std::unique_ptr getAzureBlobStorageSettings(const Poco::Util::AbstractConfiguration & config, const String & config_prefix, ContextPtr /*context*/) +std::unique_ptr getAzureBlobStorageSettings(const Poco::Util::AbstractConfiguration & config, const String & config_prefix, ContextPtr context) { return std::make_unique( config.getUInt64(config_prefix + ".max_single_part_upload_size", 100 * 1024 * 1024), @@ -165,7 +166,7 @@ std::unique_ptr getAzureBlobStorageSettings(const Po config.getInt(config_prefix + ".max_single_read_retries", 3), config.getInt(config_prefix + ".max_single_download_retries", 3), config.getInt(config_prefix + ".list_object_keys_size", 1000), - config.getUInt64(config_prefix + ".max_unexpected_write_error_retries", 4) + config.getUInt64(config_prefix + ".max_unexpected_write_error_retries", context->getSettings().azure_max_unexpected_write_error_retries) ); } From 05609cf75d5048fbd62508fcf6454cec1855943d Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Fri, 19 Jan 2024 17:02:17 +0100 Subject: [PATCH 0183/1081] Ci to CI --- tests/ci/ci_config.py | 6 +++--- tests/ci/test_ci_config.py | 2 +- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/tests/ci/ci_config.py b/tests/ci/ci_config.py index 1d94f4fc1cc..611767be2e4 100644 --- a/tests/ci/ci_config.py +++ b/tests/ci/ci_config.py @@ -270,9 +270,9 @@ sql_test_params = { @dataclass -class CiConfig: +class CIConfig: """ - Contains configs for ALL jobs in CI pipeline + Contains configs for all jobs in the CI pipeline each config item in the below dicts should be an instance of JobConfig class or inherited from it """ @@ -435,7 +435,7 @@ class CiConfig: raise KeyError("config contains errors", errors) -CI_CONFIG = CiConfig( +CI_CONFIG = CIConfig( label_configs={ Labels.DO_NOT_TEST_LABEL.value: LabelConfig(run_jobs=["Style check"]), }, diff --git a/tests/ci/test_ci_config.py b/tests/ci/test_ci_config.py index d22ed16748e..49d49d9c328 100644 --- a/tests/ci/test_ci_config.py +++ b/tests/ci/test_ci_config.py @@ -3,7 +3,7 @@ import unittest -class TestCiConfig(unittest.TestCase): +class TestCIConfig(unittest.TestCase): def test_no_errors_in_ci_config(self): raised = None try: From 639d7745d450073234405d0725cbd64884d4f8c5 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Fri, 19 Jan 2024 17:02:23 +0100 Subject: [PATCH 0184/1081] Fix error --- docker/test/base/setup_export_logs.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docker/test/base/setup_export_logs.sh b/docker/test/base/setup_export_logs.sh index 7033d4b52e2..d3721108426 100755 --- a/docker/test/base/setup_export_logs.sh +++ b/docker/test/base/setup_export_logs.sh @@ -181,7 +181,7 @@ function setup_logs_replication # Create the destination table with adapted name and structure: statement=$(clickhouse-client --format TSVRaw --query "SHOW CREATE TABLE system.${table}" | sed -r -e ' s/^\($/('"$EXTRA_COLUMNS_FOR_TABLE"'/; - s/ORDER BY \(?(.+?)\)?/ORDER BY ('"$EXTRA_ORDER_BY_COLUMNS"', \1)/; + s/^ORDER BY \(?(.+?)\)?$/ORDER BY ('"$EXTRA_ORDER_BY_COLUMNS"', \1)/; s/^CREATE TABLE system\.\w+_log$/CREATE TABLE IF NOT EXISTS '"$table"'_'"$hash"'/; /^TTL /d ') From 8c54a09e6652b491764abeddf3a0e8e6800374ef Mon Sep 17 00:00:00 2001 From: Alexey 
Milovidov Date: Sat, 20 Jan 2024 08:59:29 +0100 Subject: [PATCH 0185/1081] Fix error --- docker/test/base/setup_export_logs.sh | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/docker/test/base/setup_export_logs.sh b/docker/test/base/setup_export_logs.sh index d3721108426..156adb1d1e4 100755 --- a/docker/test/base/setup_export_logs.sh +++ b/docker/test/base/setup_export_logs.sh @@ -17,7 +17,7 @@ CLICKHOUSE_CI_LOGS_CLUSTER=${CLICKHOUSE_CI_LOGS_CLUSTER:-system_logs_export} EXTRA_COLUMNS=${EXTRA_COLUMNS:-"pull_request_number UInt32, commit_sha String, check_start_time DateTime('UTC'), check_name LowCardinality(String), instance_type LowCardinality(String), instance_id String, INDEX ix_pr (pull_request_number) TYPE set(100), INDEX ix_commit (commit_sha) TYPE set(100), INDEX ix_check_time (check_start_time) TYPE minmax, "} EXTRA_COLUMNS_EXPRESSION=${EXTRA_COLUMNS_EXPRESSION:-"CAST(0 AS UInt32) AS pull_request_number, '' AS commit_sha, now() AS check_start_time, toLowCardinality('') AS check_name, toLowCardinality('') AS instance_type, '' AS instance_id"} -EXTRA_ORDER_BY_COLUMNS=${EXTRA_ORDER_BY_COLUMNS:-"check_name, "} +EXTRA_ORDER_BY_COLUMNS=${EXTRA_ORDER_BY_COLUMNS:-"check_name"} # trace_log needs more columns for symbolization EXTRA_COLUMNS_TRACE_LOG="${EXTRA_COLUMNS} symbols Array(LowCardinality(String)), lines Array(LowCardinality(String)), " @@ -181,7 +181,7 @@ function setup_logs_replication # Create the destination table with adapted name and structure: statement=$(clickhouse-client --format TSVRaw --query "SHOW CREATE TABLE system.${table}" | sed -r -e ' s/^\($/('"$EXTRA_COLUMNS_FOR_TABLE"'/; - s/^ORDER BY \(?(.+?)\)?$/ORDER BY ('"$EXTRA_ORDER_BY_COLUMNS"', \1)/; + s/^ORDER BY (([^\(].+?)|\((.+?)\))$/ORDER BY ('"$EXTRA_ORDER_BY_COLUMNS"', \2\3)/; s/^CREATE TABLE system\.\w+_log$/CREATE TABLE IF NOT EXISTS '"$table"'_'"$hash"'/; /^TTL /d ') From caf9d8df6d789203a4e408341c9494952eb14ad2 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Sat, 20 Jan 2024 14:59:13 +0100 Subject: [PATCH 0186/1081] Update test.py --- tests/integration/test_broken_projections/test.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py index 8e3978a078e..d750bb5827d 100644 --- a/tests/integration/test_broken_projections/test.py +++ b/tests/integration/test_broken_projections/test.py @@ -413,6 +413,8 @@ def test_broken_projections_in_backups(cluster): table_name = "test4" create_table(node, table_name, 1) + node.qeury("SYSTEM STOP MERGES") + insert(node, table_name, 0, 5) insert(node, table_name, 5, 5) insert(node, table_name, 10, 5) @@ -557,3 +559,4 @@ def test_broken_projections_in_backups(cluster): assert "all_1_1_0\tproj\tNO_FILE_IN_DATA_PART" == get_broken_projections_info( node, table_name ) + node.qeury("SYSTEM START MERGES") From e5c3b67f379efdd6d403be08f8bce164348663a1 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Sat, 20 Jan 2024 16:10:09 +0100 Subject: [PATCH 0187/1081] Update test.py --- tests/integration/test_broken_projections/test.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py index d750bb5827d..acf0160cf1b 100644 --- a/tests/integration/test_broken_projections/test.py +++ b/tests/integration/test_broken_projections/test.py @@ -413,7 +413,7 @@ def 
test_broken_projections_in_backups(cluster): table_name = "test4" create_table(node, table_name, 1) - node.qeury("SYSTEM STOP MERGES") + node.query("SYSTEM STOP MERGES") insert(node, table_name, 0, 5) insert(node, table_name, 5, 5) @@ -559,4 +559,4 @@ def test_broken_projections_in_backups(cluster): assert "all_1_1_0\tproj\tNO_FILE_IN_DATA_PART" == get_broken_projections_info( node, table_name ) - node.qeury("SYSTEM START MERGES") + node.query("SYSTEM START MERGES") From cfe60586c007a230df68771b3f914d9a66414b7d Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sat, 20 Jan 2024 21:45:11 +0100 Subject: [PATCH 0188/1081] Reset coverage after each test --- tests/clickhouse-test | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/clickhouse-test b/tests/clickhouse-test index b62bd5975ea..49c517852a6 100755 --- a/tests/clickhouse-test +++ b/tests/clickhouse-test @@ -2894,7 +2894,7 @@ def parse_args(): parser.add_argument( "--reset-coverage-before-every-test", action="store_true", - default=False, + default=True, help="Collect isolated test coverage for every test instead of a cumulative. Useful only when tests are run sequentially.", ) parser.add_argument( From 51cc01f8be8fea1fcaea0af9c85ca2930536e593 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 21 Jan 2024 14:36:03 +0100 Subject: [PATCH 0189/1081] Minor change --- base/base/coverage.cpp | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/base/base/coverage.cpp b/base/base/coverage.cpp index 499e384d21f..05bef21049b 100644 --- a/base/base/coverage.cpp +++ b/base/base/coverage.cpp @@ -62,6 +62,7 @@ namespace uintptr_t * allocate(size_t size) { + /// Note: mmap return zero-initialized memory, and we count on that. void * map = mmap(nullptr, size, PROT_READ | PROT_WRITE, MAP_PRIVATE | MAP_ANONYMOUS, -1, 0); if (MAP_FAILED == map) return nullptr; @@ -91,8 +92,6 @@ void __sanitizer_cov_trace_pc_guard_init(uint32_t * start, uint32_t * stop) /// Note: we will leak this. current_coverage_array = allocate(sizeof(uintptr_t) * coverage_array_size); cumulative_coverage_array = allocate(sizeof(uintptr_t) * coverage_array_size); - - resetCoverage(); } /// This is called at least once for every DSO for initialization From b967cc6af9deac20eff318e3433fc5b09fd6314a Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Sun, 21 Jan 2024 15:30:50 +0100 Subject: [PATCH 0190/1081] Fix error --- base/base/coverage.cpp | 10 ++++++---- 1 file changed, 6 insertions(+), 4 deletions(-) diff --git a/base/base/coverage.cpp b/base/base/coverage.cpp index 05bef21049b..b85f1a16d32 100644 --- a/base/base/coverage.cpp +++ b/base/base/coverage.cpp @@ -92,6 +92,8 @@ void __sanitizer_cov_trace_pc_guard_init(uint32_t * start, uint32_t * stop) /// Note: we will leak this. current_coverage_array = allocate(sizeof(uintptr_t) * coverage_array_size); cumulative_coverage_array = allocate(sizeof(uintptr_t) * coverage_array_size); + + resetCoverage(); } /// This is called at least once for every DSO for initialization @@ -102,8 +104,8 @@ void __sanitizer_cov_pcs_init(const uintptr_t * pcs_begin, const uintptr_t * pcs return; pc_table_initialized = true; - all_addresses_array = allocate(sizeof(uintptr_t) * coverage_array_size); all_addresses_array_size = pcs_end - pcs_begin; + all_addresses_array = allocate(sizeof(uintptr_t) * all_addresses_array_size); /// They are not a real pointers, but also contain a flag in the most significant bit, /// in which we are not interested for now. Reset it. 
@@ -125,10 +127,10 @@ void __sanitizer_cov_trace_pc_guard(uint32_t * guard) /// The values of `*guard` are as you set them in /// __sanitizer_cov_trace_pc_guard_init and so you can make them consecutive /// and use them to dereference an array or a bit vector. - void * pc = __builtin_return_address(0); + intptr_t pc = reinterpret_cast(__builtin_return_address(0)); - current_coverage_array[guard - guards_start] = reinterpret_cast(pc); - cumulative_coverage_array[guard - guards_start] = reinterpret_cast(pc); + current_coverage_array[guard - guards_start] = pc; + cumulative_coverage_array[guard - guards_start] = pc; } } From eae39ff545978386a8a57bca7c68b1ff97cf6d6d Mon Sep 17 00:00:00 2001 From: Blargian Date: Sun, 21 Jan 2024 21:51:06 +0200 Subject: [PATCH 0191/1081] #31363 - modified TemplateBlockOutputFormat to work with added format_schema_rows_template setting --- src/Core/Settings.h | 2 +- src/Formats/FormatFactory.cpp | 3 +- src/Formats/FormatSettings.h | 2 +- .../Impl/TemplateBlockOutputFormat.cpp | 33 +++++++++++++++---- 4 files changed, 31 insertions(+), 9 deletions(-) diff --git a/src/Core/Settings.h b/src/Core/Settings.h index 4de739ec405..3143ada7d65 100644 --- a/src/Core/Settings.h +++ b/src/Core/Settings.h @@ -1078,8 +1078,8 @@ class IColumn; M(String, format_schema, "", "Schema identifier (used by schema-based formats)", 0) \ M(String, format_template_resultset, "", "Path to file which contains format string for result set (for Template format)", 0) \ M(String, format_template_row, "", "Path to file which contains format string for rows (for Template format)", 0) \ - M(String, format_template_rows_between_delimiter, "\n", "Delimiter between rows (for Template format)", 0) \ M(String, format_schema_rows_template, "\n", "Format string for rows (for Template format)", 0) \ + M(String, format_template_rows_between_delimiter, "\n", "Delimiter between rows (for Template format)", 0) \ \ M(EscapingRule, format_custom_escaping_rule, "Escaped", "Field escaping rule (for CustomSeparated format)", 0) \ M(String, format_custom_field_delimiter, "\t", "Delimiter between fields (for CustomSeparated format)", 0) \ diff --git a/src/Formats/FormatFactory.cpp b/src/Formats/FormatFactory.cpp index 6f414c5a69f..6f7f758621c 100644 --- a/src/Formats/FormatFactory.cpp +++ b/src/Formats/FormatFactory.cpp @@ -166,7 +166,8 @@ FormatSettings getFormatSettings(ContextPtr context, const Settings & settings) format_settings.template_settings.resultset_format = settings.format_template_resultset; format_settings.template_settings.row_between_delimiter = settings.format_template_rows_between_delimiter; format_settings.template_settings.row_format = settings.format_template_row; - format_settings.template_settings.row_format_schema_string = settings.format_schema_rows_template; + format_settings.template_settings.row_format_schema = settings.format_schema_rows_template; + format_settings.template_settings.row_between_delimiter_schema = settings.format_schema_rows_between_delimiter; format_settings.tsv.crlf_end_of_line = settings.output_format_tsv_crlf_end_of_line; format_settings.tsv.empty_as_default = settings.input_format_tsv_empty_as_default; format_settings.tsv.enum_as_number = settings.input_format_tsv_enum_as_number; diff --git a/src/Formats/FormatSettings.h b/src/Formats/FormatSettings.h index 70d33a1edcd..28a2076af84 100644 --- a/src/Formats/FormatSettings.h +++ b/src/Formats/FormatSettings.h @@ -338,7 +338,7 @@ struct FormatSettings String resultset_format; String row_format; String 
row_between_delimiter; - String row_format_schema_string; + String row_format_schema; } template_settings; struct diff --git a/src/Processors/Formats/Impl/TemplateBlockOutputFormat.cpp b/src/Processors/Formats/Impl/TemplateBlockOutputFormat.cpp index 6d8fe1e5a2c..495cc0e541e 100644 --- a/src/Processors/Formats/Impl/TemplateBlockOutputFormat.cpp +++ b/src/Processors/Formats/Impl/TemplateBlockOutputFormat.cpp @@ -11,6 +11,7 @@ namespace DB namespace ErrorCodes { extern const int SYNTAX_ERROR; + extern const int INVALID_TEMPLATE_FORMAT; } TemplateBlockOutputFormat::TemplateBlockOutputFormat(const Block & header_, WriteBuffer & out_, const FormatSettings & settings_, @@ -213,14 +214,34 @@ void registerOutputFormatTemplate(FormatFactory & factory) }); } - ParsedTemplateFormatString row_format = ParsedTemplateFormatString( + ParsedTemplateFormatString row_format; + auto idx_by_name = [&](const String & colName) + { + return sample.getPositionByName(colName); + }; + if (settings.template_settings.row_format.empty()) + { + if (settings.template_settings.row_format_schema.empty()) + { + throw Exception(DB::ErrorCodes::INVALID_TEMPLATE_FORMAT, "Expected either format_template_row or format_schema_rows_template"); + } + else + { + row_format = ParsedTemplateFormatString(); + row_format.parse(settings.template_settings.row_format_schema,idx_by_name); + } + } + else + { + if (settings.template_settings.row_format_schema.empty()) + { + throw Exception(DB::ErrorCodes::INVALID_TEMPLATE_FORMAT, "Expected either format_template_row or format_schema_rows_template"); + } + row_format = ParsedTemplateFormatString( FormatSchemaInfo(settings.template_settings.row_format, "Template", false, settings.schema.is_server, settings.schema.format_schema_path), - [&](const String & colName) - { - return sample.getPositionByName(colName); - }); - + idx_by_name); + } return std::make_shared(sample, buf, settings, resultset_format, row_format, settings.template_settings.row_between_delimiter); }); From 02b178cc9c9b38a30344e2ddd896c1eaf429c3de Mon Sep 17 00:00:00 2001 From: MochiXu Date: Mon, 22 Jan 2024 11:08:03 +0800 Subject: [PATCH 0192/1081] fix drop inverted index --- src/Storages/MergeTree/MutateTask.cpp | 22 ++++++++++++++-------- 1 file changed, 14 insertions(+), 8 deletions(-) diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index e4070aa8262..8ed8b8bba4c 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -674,15 +674,21 @@ static NameToNameVector collectFilesForRenames( { if (command.type == MutationCommand::Type::DROP_INDEX) { - if (source_part->checksums.has(INDEX_FILE_PREFIX + command.column_name + ".idx2")) + const std::vector suffixes = {".idx2", ".idx", ".gin_dict", ".gin_post", ".gin_seg", ".gin_sid"}; + + for (const auto& suffix : suffixes) { - add_rename(INDEX_FILE_PREFIX + command.column_name + ".idx2", ""); - add_rename(INDEX_FILE_PREFIX + command.column_name + mrk_extension, ""); - } - else if (source_part->checksums.has(INDEX_FILE_PREFIX + command.column_name + ".idx")) - { - add_rename(INDEX_FILE_PREFIX + command.column_name + ".idx", ""); - add_rename(INDEX_FILE_PREFIX + command.column_name + mrk_extension, ""); + String filename = INDEX_FILE_PREFIX + command.column_name + suffix; + + if ((suffix == ".idx2" || suffix == ".idx") && source_part->checksums.has(filename)) + { + add_rename(filename, ""); + add_rename(INDEX_FILE_PREFIX + command.column_name + mrk_extension, ""); + } + else if 
(source_part->checksums.has(filename)) + { + add_rename(filename, ""); + } } } else if (command.type == MutationCommand::Type::DROP_PROJECTION) From d2c671c17eb4a85583b30d81033f7180ea93f627 Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Fri, 19 Jan 2024 20:38:08 +0000 Subject: [PATCH 0193/1081] 1st attempt at vectorization 80 mio arrays with 150 elements each, runtimes in sec WITH (SELECT vec FROM vectors limit 1) AS const_vec SELECT sum(dist) FROM (SELECT (const_vec, vec) AS dist FROM vectors) auto-vectorized hand-vectorized L2 Float32 0.61 0.57 L2 Float64 1.15 0.99 cos Float32 0.78 0.65 cos Float64 1.35 1.05 --- src/Functions/array/arrayDistance.cpp | 145 +++++++++++++++++- .../02282_array_distance.reference | 4 + .../0_stateless/02282_array_distance.sql | 40 +++-- 3 files changed, 172 insertions(+), 17 deletions(-) diff --git a/src/Functions/array/arrayDistance.cpp b/src/Functions/array/arrayDistance.cpp index c68c89ee0d5..670442c0c79 100644 --- a/src/Functions/array/arrayDistance.cpp +++ b/src/Functions/array/arrayDistance.cpp @@ -1,6 +1,7 @@ #include #include #include +#include #include #include #include @@ -9,6 +10,10 @@ #include #include +#if USE_MULTITARGET_CODE +#include +#endif + namespace DB { namespace ErrorCodes @@ -75,6 +80,49 @@ struct L2Distance state.sum += other_state.sum; } +#if USE_MULTITARGET_CODE + template + AVX512_FUNCTION_SPECIFIC_ATTRIBUTE static void accumulateCombine( + const ResultType * __restrict data_x, + const ResultType * __restrict data_y, + size_t i_max, + size_t & i_x, + size_t & i_y, + State & state) + { + __m512 sums; + if constexpr (std::is_same_v) + sums = _mm512_setzero_ps(); + else + sums = _mm512_setzero_pd(); + + const size_t n = (std::is_same_v) ? 16 : 8; + + for (; i_x + n < i_max; i_x += n, i_y += n) + { + if constexpr (std::is_same_v) + { + __m512 x = _mm512_loadu_ps(data_x + i_x); + __m512 y = _mm512_loadu_ps(data_y + i_y); + __m512 differences = _mm512_sub_ps(x, y); + sums = _mm512_fmadd_ps(differences, differences, sums); + } + else + { + __m512 x = _mm512_loadu_pd(data_x + i_x); + __m512 y = _mm512_loadu_pd(data_y + i_y); + __m512 differences = _mm512_sub_pd(x, y); + sums = _mm512_fmadd_pd(differences, differences, sums); + } + } + + if constexpr (std::is_same_v) + state.sum = _mm512_reduce_add_ps(sums); + else + state.sum = _mm512_reduce_add_pd(sums); + } +#endif + template static ResultType finalize(const State & state, const ConstParams &) { @@ -189,6 +237,70 @@ struct CosineDistance state.y_squared += other_state.y_squared; } +#if USE_MULTITARGET_CODE + template + AVX512_FUNCTION_SPECIFIC_ATTRIBUTE static void accumulateCombine( + const ResultType * __restrict data_x, + const ResultType * __restrict data_y, + size_t i_max, + size_t & i_x, + size_t & i_y, + State & state) + { + __m512 dot_products; + __m512 x_squareds; + __m512 y_squareds; + + if constexpr (std::is_same_v) + { + dot_products = _mm512_setzero_ps(); + x_squareds = _mm512_setzero_ps(); + y_squareds = _mm512_setzero_ps(); + } + else + { + dot_products = _mm512_setzero_pd(); + x_squareds = _mm512_setzero_pd(); + y_squareds = _mm512_setzero_pd(); + } + + const size_t n = (std::is_same_v) ? 
16 : 8; + + for (; i_x + n < i_max; i_x += n, i_y += n) + { + if constexpr (std::is_same_v) + { + __m512 x = _mm512_loadu_ps(data_x + i_x); + __m512 y = _mm512_loadu_ps(data_y + i_y); + dot_products = _mm512_fmadd_ps(x, y, dot_products); + x_squareds = _mm512_fmadd_ps(x, x, x_squareds); + y_squareds = _mm512_fmadd_ps(y, y, y_squareds); + } + else + { + __m512 x = _mm512_loadu_pd(data_x + i_x); + __m512 y = _mm512_loadu_pd(data_y + i_y); + dot_products = _mm512_fmadd_pd(x, y, dot_products); + x_squareds = _mm512_fmadd_pd(x, x, x_squareds); + y_squareds = _mm512_fmadd_pd(y, y, y_squareds); + } + } + + if constexpr (std::is_same_v) + { + state.dot_prod = _mm512_reduce_add_ps(dot_products); + state.x_squared = _mm512_reduce_add_ps(x_squareds); + state.y_squared = _mm512_reduce_add_ps(y_squareds); + } + else + { + state.dot_prod = _mm512_reduce_add_pd(dot_products); + state.x_squared = _mm512_reduce_add_pd(x_squareds); + state.y_squared = _mm512_reduce_add_pd(y_squareds); + } + } +#endif + template static ResultType finalize(const State & state, const ConstParams &) { @@ -352,7 +464,7 @@ private: /// Check that arrays in both columns are the sames size for (size_t row = 0; row < offsets_x.size(); ++row) { - if (unlikely(offsets_x[row] != offsets_y[row])) + if (offsets_x[row] != offsets_y[row]) [[unlikely]] { ColumnArray::Offset prev_offset = row > 0 ? offsets_x[row] : 0; throw Exception( @@ -420,7 +532,7 @@ private: ColumnArray::Offset prev_offset = 0; for (size_t row : collections::range(0, offsets_y.size())) { - if (unlikely(offsets_x[0] != offsets_y[row] - prev_offset)) + if (offsets_x[0] != offsets_y[row] - prev_offset) [[unlikely]] { throw Exception( ErrorCodes::SIZES_OF_ARRAYS_DONT_MATCH, @@ -438,14 +550,35 @@ private: auto & result_data = result->getData(); /// Do the actual computation - ColumnArray::Offset prev = 0; + size_t prev = 0; size_t row = 0; + for (auto off : offsets_y) { + size_t i = 0; + typename Kernel::template State state; + + /// SIMD optimization: process multiple elements in both input arrays at once. + /// To avoid combinatorial explosion of SIMD kernels, focus on + /// - the two most common input/output types (Float32 x Float32) --> Float32 and (Float64 x Float64) --> Float64 instead of 10 x + /// 10 input types x 2 output types, + /// - const/non-const inputs instead of non-const/non-const inputs + /// - the two most common metrics L2 and cosine distance, + /// - the most powerful SIMD instruction set (AVX-512F). 
+#if USE_MULTITARGET_CODE + if constexpr (std::is_same_v && std::is_same_v) /// ResultType is Float32 or Float64 + { + if constexpr (std::is_same_v + || std::is_same_v) + { + if (isArchSupported(TargetArch::AVX512F)) + Kernel::template accumulateCombine(data_x.data(), data_y.data(), i + offsets_x[0], i, prev, state); + } + } +#else /// Process chunks in vectorized manner static constexpr size_t VEC_SIZE = 4; typename Kernel::template State states[VEC_SIZE]; - size_t i = 0; for (; prev + VEC_SIZE < off; i += VEC_SIZE, prev += VEC_SIZE) { for (size_t s = 0; s < VEC_SIZE; ++s) @@ -453,10 +586,9 @@ private: states[s], static_cast(data_x[i + s]), static_cast(data_y[prev + s]), kernel_params); } - typename Kernel::template State state; for (const auto & other_state : states) Kernel::template combine(state, other_state, kernel_params); - +#endif /// Process the tail for (; prev < off; ++i, ++prev) { @@ -466,6 +598,7 @@ private: result_data[row] = Kernel::finalize(state, kernel_params); row++; } + return result; } diff --git a/tests/queries/0_stateless/02282_array_distance.reference b/tests/queries/0_stateless/02282_array_distance.reference index 9758da9a833..c21e294cb62 100644 --- a/tests/queries/0_stateless/02282_array_distance.reference +++ b/tests/queries/0_stateless/02282_array_distance.reference @@ -80,3 +80,7 @@ nan 5 6 268 2 10.234459893824097 23.15167380558045 536 0.00007815428961455151 6 5 268 2 10.234459893824097 23.15167380558045 536 0.00007815428961455151 6 6 0 0 0 0 0 0 +5.8309517 +0.0003244877 +5.830951894845301 +0.0003245172890904424 diff --git a/tests/queries/0_stateless/02282_array_distance.sql b/tests/queries/0_stateless/02282_array_distance.sql index 9c16071dc1f..2cca853fd67 100644 --- a/tests/queries/0_stateless/02282_array_distance.sql +++ b/tests/queries/0_stateless/02282_array_distance.sql @@ -12,10 +12,10 @@ SELECT cosineDistance([1, 2, 3], [0, 0, 0]); -- Overflows WITH CAST([-547274980, 1790553898, 1981517754, 1908431500, 1352428565, -573412550, -552499284, 2096941042], 'Array(Int32)') AS a SELECT - L1Distance(a,a), - L2Distance(a,a), - L2SquaredDistance(a,a), - LinfDistance(a,a), + L1Distance(a, a), + L2Distance(a, a), + L2SquaredDistance(a, a), + LinfDistance(a, a), cosineDistance(a, a); DROP TABLE IF EXISTS vec1; @@ -88,15 +88,33 @@ SELECT FROM vec2f v1, vec2d v2 WHERE length(v1.v) == length(v2.v); -SELECT L1Distance([0, 0], [1]); -- { serverError 190 } -SELECT L2Distance([1, 2], (3,4)); -- { serverError 43 } -SELECT L2SquaredDistance([1, 2], (3,4)); -- { serverError 43 } -SELECT LpDistance([1, 2], [3,4]); -- { serverError 42 } -SELECT LpDistance([1, 2], [3,4], -1.); -- { serverError 69 } -SELECT LpDistance([1, 2], [3,4], 'aaa'); -- { serverError 43 } -SELECT LpDistance([1, 2], [3,4], materialize(2.7)); -- { serverError 44 } +SELECT L1Distance([0, 0], [1]); -- { serverError SIZES_OF_ARRAYS_DONT_MATCH } +SELECT L2Distance([1, 2], (3,4)); -- { serverError ILLEGAL_TYPE_OF_ARGUMENT } +SELECT L2SquaredDistance([1, 2], (3,4)); -- { serverError ILLEGAL_TYPE_OF_ARGUMENT } +SELECT LpDistance([1, 2], [3,4]); -- { serverError NUMBER_OF_ARGUMENTS_DOESNT_MATCH } +SELECT LpDistance([1, 2], [3,4], -1.); -- { serverError ARGUMENT_OUT_OF_BOUND } +SELECT LpDistance([1, 2], [3,4], 'aaa'); -- { serverError ILLEGAL_TYPE_OF_ARGUMENT } +SELECT LpDistance([1, 2], [3,4], materialize(2.7)); -- { serverError ILLEGAL_COLUMN } DROP TABLE vec1; DROP TABLE vec2; DROP TABLE vec2f; DROP TABLE vec2d; + +-- Queries which trigger manually vectorized implementation + +SELECT L2Distance( + [toFloat32(0.0), 
toFloat32(1.0), toFloat32(2.0), toFloat32(3.0), toFloat32(4.0), toFloat32(5.0), toFloat32(6.0), toFloat32(7.0), toFloat32(8.0), toFloat32(9.0), toFloat32(10.0), toFloat32(11.0), toFloat32(12.0), toFloat32(13.0), toFloat32(14.0), toFloat32(15.0), toFloat32(16.0), toFloat32(17.0), toFloat32(18.0), toFloat32(19.0), toFloat32(20.0), toFloat32(21.0), toFloat32(22.0), toFloat32(23.0), toFloat32(24.0), toFloat32(25.0), toFloat32(26.0), toFloat32(27.0), toFloat32(28.0), toFloat32(29.0), toFloat32(30.0), toFloat32(31.0), toFloat32(32.0), toFloat32(33.0)], + materialize([toFloat32(1.0), toFloat32(2.0), toFloat32(3.0), toFloat32(4.0), toFloat32(5.0), toFloat32(6.0), toFloat32(7.0), toFloat32(8.0), toFloat32(9.0), toFloat32(10.0), toFloat32(11.0), toFloat32(12.0), toFloat32(13.0), toFloat32(14.0), toFloat32(15.0), toFloat32(16.0), toFloat32(17.0), toFloat32(18.0), toFloat32(19.0), toFloat32(20.0), toFloat32(21.0), toFloat32(22.0), toFloat32(23.0), toFloat32(24.0), toFloat32(25.0), toFloat32(26.0), toFloat32(27.0), toFloat32(28.0), toFloat32(29.0), toFloat32(30.0), toFloat32(31.0), toFloat32(32.0), toFloat32(33.0), toFloat32(34.0)])); + +SELECT cosineDistance( + [toFloat32(0.0), toFloat32(1.0), toFloat32(2.0), toFloat32(3.0), toFloat32(4.0), toFloat32(5.0), toFloat32(6.0), toFloat32(7.0), toFloat32(8.0), toFloat32(9.0), toFloat32(10.0), toFloat32(11.0), toFloat32(12.0), toFloat32(13.0), toFloat32(14.0), toFloat32(15.0), toFloat32(16.0), toFloat32(17.0), toFloat32(18.0), toFloat32(19.0), toFloat32(20.0), toFloat32(21.0), toFloat32(22.0), toFloat32(23.0), toFloat32(24.0), toFloat32(25.0), toFloat32(26.0), toFloat32(27.0), toFloat32(28.0), toFloat32(29.0), toFloat32(30.0), toFloat32(31.0), toFloat32(32.0), toFloat32(33.0)], + materialize([toFloat32(1.0), toFloat32(2.0), toFloat32(3.0), toFloat32(4.0), toFloat32(5.0), toFloat32(6.0), toFloat32(7.0), toFloat32(8.0), toFloat32(9.0), toFloat32(10.0), toFloat32(11.0), toFloat32(12.0), toFloat32(13.0), toFloat32(14.0), toFloat32(15.0), toFloat32(16.0), toFloat32(17.0), toFloat32(18.0), toFloat32(19.0), toFloat32(20.0), toFloat32(21.0), toFloat32(22.0), toFloat32(23.0), toFloat32(24.0), toFloat32(25.0), toFloat32(26.0), toFloat32(27.0), toFloat32(28.0), toFloat32(29.0), toFloat32(30.0), toFloat32(31.0), toFloat32(32.0), toFloat32(33.0), toFloat32(34.0)])); + +SELECT L2Distance( + [toFloat64(0.0), toFloat64(1.0), toFloat64(2.0), toFloat64(3.0), toFloat64(4.0), toFloat64(5.0), toFloat64(6.0), toFloat64(7.0), toFloat64(8.0), toFloat64(9.0), toFloat64(10.0), toFloat64(11.0), toFloat64(12.0), toFloat64(13.0), toFloat64(14.0), toFloat64(15.0), toFloat64(16.0), toFloat64(17.0), toFloat64(18.0), toFloat64(19.0), toFloat64(20.0), toFloat64(21.0), toFloat64(22.0), toFloat64(23.0), toFloat64(24.0), toFloat64(25.0), toFloat64(26.0), toFloat64(27.0), toFloat64(28.0), toFloat64(29.0), toFloat64(30.0), toFloat64(31.0), toFloat64(32.0), toFloat64(33.0)], + materialize([toFloat64(1.0), toFloat64(2.0), toFloat64(3.0), toFloat64(4.0), toFloat64(5.0), toFloat64(6.0), toFloat64(7.0), toFloat64(8.0), toFloat64(9.0), toFloat64(10.0), toFloat64(11.0), toFloat64(12.0), toFloat64(13.0), toFloat64(14.0), toFloat64(15.0), toFloat64(16.0), toFloat64(17.0), toFloat64(18.0), toFloat64(19.0), toFloat64(20.0), toFloat64(21.0), toFloat64(22.0), toFloat64(23.0), toFloat64(24.0), toFloat64(25.0), toFloat64(26.0), toFloat64(27.0), toFloat64(28.0), toFloat64(29.0), toFloat64(30.0), toFloat64(31.0), toFloat64(32.0), toFloat64(33.0), toFloat64(34.0)])); + +SELECT cosineDistance( + [toFloat64(0.0), 
toFloat64(1.0), toFloat64(2.0), toFloat64(3.0), toFloat64(4.0), toFloat64(5.0), toFloat64(6.0), toFloat64(7.0), toFloat64(8.0), toFloat64(9.0), toFloat64(10.0), toFloat64(11.0), toFloat64(12.0), toFloat64(13.0), toFloat64(14.0), toFloat64(15.0), toFloat64(16.0), toFloat64(17.0), toFloat64(18.0), toFloat64(19.0), toFloat64(20.0), toFloat64(21.0), toFloat64(22.0), toFloat64(23.0), toFloat64(24.0), toFloat64(25.0), toFloat64(26.0), toFloat64(27.0), toFloat64(28.0), toFloat64(29.0), toFloat64(30.0), toFloat64(31.0), toFloat64(32.0), toFloat64(33.0)], + materialize([toFloat64(1.0), toFloat64(2.0), toFloat64(3.0), toFloat64(4.0), toFloat64(5.0), toFloat64(6.0), toFloat64(7.0), toFloat64(8.0), toFloat64(9.0), toFloat64(10.0), toFloat64(11.0), toFloat64(12.0), toFloat64(13.0), toFloat64(14.0), toFloat64(15.0), toFloat64(16.0), toFloat64(17.0), toFloat64(18.0), toFloat64(19.0), toFloat64(20.0), toFloat64(21.0), toFloat64(22.0), toFloat64(23.0), toFloat64(24.0), toFloat64(25.0), toFloat64(26.0), toFloat64(27.0), toFloat64(28.0), toFloat64(29.0), toFloat64(30.0), toFloat64(31.0), toFloat64(32.0), toFloat64(33.0), toFloat64(34.0)])); From 68d0f4e42161713f3b54de2069d894b1f84ed833 Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Sat, 20 Jan 2024 21:36:25 +0000 Subject: [PATCH 0194/1081] (Futile) unrolling attempt at vectorization --- src/Functions/array/arrayDistance.cpp | 88 ++++++++++++++++++++++----- 1 file changed, 72 insertions(+), 16 deletions(-) diff --git a/src/Functions/array/arrayDistance.cpp b/src/Functions/array/arrayDistance.cpp index 670442c0c79..aa13ee01d9a 100644 --- a/src/Functions/array/arrayDistance.cpp +++ b/src/Functions/array/arrayDistance.cpp @@ -90,36 +90,92 @@ struct L2Distance size_t & i_y, State & state) { - __m512 sums; - if constexpr (std::is_same_v) - sums = _mm512_setzero_ps(); - else - sums = _mm512_setzero_pd(); + __m512 sums1; + __m512 sums2; + __m512 sums3; + __m512 sums4; - const size_t n = (std::is_same_v) ? 16 : 8; + if constexpr (std::is_same_v) + { + sums1 = _mm512_setzero_ps(); + sums2 = _mm512_setzero_ps(); + sums3 = _mm512_setzero_ps(); + sums4 = _mm512_setzero_ps(); + } + else + { + sums1 = _mm512_setzero_pd(); + sums2 = _mm512_setzero_pd(); + sums3 = _mm512_setzero_pd(); + sums4 = _mm512_setzero_pd(); + } + + const size_t n = (std::is_same_v) ? 
64 : 32; for (; i_x + n < i_max; i_x += n, i_y += n) { if constexpr (std::is_same_v) { - __m512 x = _mm512_loadu_ps(data_x + i_x); - __m512 y = _mm512_loadu_ps(data_y + i_y); - __m512 differences = _mm512_sub_ps(x, y); - sums = _mm512_fmadd_ps(differences, differences, sums); + __m512 x1 = _mm512_loadu_ps(data_x + i_x); + __m512 y1 = _mm512_loadu_ps(data_y + i_y); + __m512 diff1 = _mm512_sub_ps(x1, y1); + sums1 = _mm512_fmadd_ps(diff1, diff1, sums1); + + __m512 x2 = _mm512_loadu_ps(data_x + i_x + 16); + __m512 y2 = _mm512_loadu_ps(data_y + i_y + 16); + __m512 diff2 = _mm512_sub_ps(x2, y2); + sums2 = _mm512_fmadd_ps(diff2, diff2, sums2); + + __m512 x3 = _mm512_loadu_ps(data_x + i_x + 32); + __m512 y3 = _mm512_loadu_ps(data_y + i_y + 32); + __m512 diff3 = _mm512_sub_ps(x3, y3); + sums3 = _mm512_fmadd_ps(diff3, diff3, sums3); + + __m512 x4 = _mm512_loadu_ps(data_x + i_x + 48); + __m512 y4 = _mm512_loadu_ps(data_y + i_y + 48); + __m512 diff4 = _mm512_sub_ps(x4, y4); + sums4 = _mm512_fmadd_ps(diff4, diff4, sums4); } else { - __m512 x = _mm512_loadu_pd(data_x + i_x); - __m512 y = _mm512_loadu_pd(data_y + i_y); - __m512 differences = _mm512_sub_pd(x, y); - sums = _mm512_fmadd_pd(differences, differences, sums); + __m512 x1 = _mm512_loadu_pd(data_x + i_x); + __m512 y1 = _mm512_loadu_pd(data_y + i_y); + __m512 diff1 = _mm512_sub_pd(x1, y1); + sums1 = _mm512_fmadd_pd(diff1, diff1, sums1); + + __m512 x2 = _mm512_loadu_pd(data_x + i_x + 8); + __m512 y2 = _mm512_loadu_pd(data_y + i_y + 8); + __m512 diff2 = _mm512_sub_pd(x2, y2); + sums2 = _mm512_fmadd_pd(diff2, diff2, sums2); + + __m512 x3 = _mm512_loadu_pd(data_x + i_x + 16); + __m512 y3 = _mm512_loadu_pd(data_y + i_y + 16); + __m512 diff3 = _mm512_sub_pd(x3, y3); + sums3 = _mm512_fmadd_pd(diff3, diff3, sums3); + + __m512 x4 = _mm512_loadu_pd(data_x + i_x + 24); + __m512 y4 = _mm512_loadu_pd(data_y + i_y + 24); + __m512 diff4 = _mm512_sub_pd(x4, y4); + sums4 = _mm512_fmadd_pd(diff4, diff4, sums4); } } if constexpr (std::is_same_v) - state.sum = _mm512_reduce_add_ps(sums); + { + Float32 sum1 = _mm512_reduce_add_ps(sums1); + Float32 sum2 = _mm512_reduce_add_ps(sums2); + Float32 sum3 = _mm512_reduce_add_ps(sums3); + Float32 sum4 = _mm512_reduce_add_ps(sums4); + state.sum = sum1 + sum2 + sum3 + sum4; + } else - state.sum = _mm512_reduce_add_pd(sums); + { + Float64 sum1 = _mm512_reduce_add_pd(sums1); + Float64 sum2 = _mm512_reduce_add_pd(sums2); + Float64 sum3 = _mm512_reduce_add_pd(sums3); + Float64 sum4 = _mm512_reduce_add_pd(sums4); + state.sum = sum1 + sum2 + sum3 + sum4; + } } #endif From 68fc97089ec22d29b5d25df4e3865a22cf9701db Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Sat, 20 Jan 2024 21:50:13 +0000 Subject: [PATCH 0195/1081] Revert "(Futile) unrolling attempt at vectorization" This reverts commit df30a990545eafdf5e6a09034d81a97fb0188ba0. 
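For readers following these three vectorization patches: the computation that the AVX-512 kernels (and the reverted unrolled variant) accelerate reduces to the scalar form below. This is only an illustrative sketch with free-standing functions and made-up names — the real code lives in the Kernel::accumulate/accumulateCombine/finalize interfaces of arrayDistance.cpp — but it shows what is being summed per element and how the final value is produced.

#include <cmath>
#include <cstddef>

/// Scalar reference for L2Distance: accumulate squared differences, then take the square root.
float l2DistanceScalar(const float * x, const float * y, size_t n)
{
    float sum = 0.0f;
    for (size_t i = 0; i < n; ++i)
    {
        float diff = x[i] - y[i];
        sum += diff * diff;        /// the _mm512_fmadd_ps loop does the same for 16 floats per iteration
    }
    return std::sqrt(sum);
}

/// Scalar reference for cosineDistance: accumulate the dot product and both squared norms,
/// then finalize as 1 - dot / sqrt(|x|^2 * |y|^2).
float cosineDistanceScalar(const float * x, const float * y, size_t n)
{
    float dot = 0.0f, x_squared = 0.0f, y_squared = 0.0f;
    for (size_t i = 0; i < n; ++i)
    {
        dot += x[i] * y[i];
        x_squared += x[i] * x[i];
        y_squared += y[i] * y[i];
    }
    return 1.0f - dot / std::sqrt(x_squared * y_squared);
}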
--- src/Functions/array/arrayDistance.cpp | 84 +++++---------------------- 1 file changed, 14 insertions(+), 70 deletions(-) diff --git a/src/Functions/array/arrayDistance.cpp b/src/Functions/array/arrayDistance.cpp index aa13ee01d9a..670442c0c79 100644 --- a/src/Functions/array/arrayDistance.cpp +++ b/src/Functions/array/arrayDistance.cpp @@ -90,92 +90,36 @@ struct L2Distance size_t & i_y, State & state) { - __m512 sums1; - __m512 sums2; - __m512 sums3; - __m512 sums4; - + __m512 sums; if constexpr (std::is_same_v) - { - sums1 = _mm512_setzero_ps(); - sums2 = _mm512_setzero_ps(); - sums3 = _mm512_setzero_ps(); - sums4 = _mm512_setzero_ps(); - } + sums = _mm512_setzero_ps(); else - { - sums1 = _mm512_setzero_pd(); - sums2 = _mm512_setzero_pd(); - sums3 = _mm512_setzero_pd(); - sums4 = _mm512_setzero_pd(); - } + sums = _mm512_setzero_pd(); - const size_t n = (std::is_same_v) ? 64 : 32; + const size_t n = (std::is_same_v) ? 16 : 8; for (; i_x + n < i_max; i_x += n, i_y += n) { if constexpr (std::is_same_v) { - __m512 x1 = _mm512_loadu_ps(data_x + i_x); - __m512 y1 = _mm512_loadu_ps(data_y + i_y); - __m512 diff1 = _mm512_sub_ps(x1, y1); - sums1 = _mm512_fmadd_ps(diff1, diff1, sums1); - - __m512 x2 = _mm512_loadu_ps(data_x + i_x + 16); - __m512 y2 = _mm512_loadu_ps(data_y + i_y + 16); - __m512 diff2 = _mm512_sub_ps(x2, y2); - sums2 = _mm512_fmadd_ps(diff2, diff2, sums2); - - __m512 x3 = _mm512_loadu_ps(data_x + i_x + 32); - __m512 y3 = _mm512_loadu_ps(data_y + i_y + 32); - __m512 diff3 = _mm512_sub_ps(x3, y3); - sums3 = _mm512_fmadd_ps(diff3, diff3, sums3); - - __m512 x4 = _mm512_loadu_ps(data_x + i_x + 48); - __m512 y4 = _mm512_loadu_ps(data_y + i_y + 48); - __m512 diff4 = _mm512_sub_ps(x4, y4); - sums4 = _mm512_fmadd_ps(diff4, diff4, sums4); + __m512 x = _mm512_loadu_ps(data_x + i_x); + __m512 y = _mm512_loadu_ps(data_y + i_y); + __m512 differences = _mm512_sub_ps(x, y); + sums = _mm512_fmadd_ps(differences, differences, sums); } else { - __m512 x1 = _mm512_loadu_pd(data_x + i_x); - __m512 y1 = _mm512_loadu_pd(data_y + i_y); - __m512 diff1 = _mm512_sub_pd(x1, y1); - sums1 = _mm512_fmadd_pd(diff1, diff1, sums1); - - __m512 x2 = _mm512_loadu_pd(data_x + i_x + 8); - __m512 y2 = _mm512_loadu_pd(data_y + i_y + 8); - __m512 diff2 = _mm512_sub_pd(x2, y2); - sums2 = _mm512_fmadd_pd(diff2, diff2, sums2); - - __m512 x3 = _mm512_loadu_pd(data_x + i_x + 16); - __m512 y3 = _mm512_loadu_pd(data_y + i_y + 16); - __m512 diff3 = _mm512_sub_pd(x3, y3); - sums3 = _mm512_fmadd_pd(diff3, diff3, sums3); - - __m512 x4 = _mm512_loadu_pd(data_x + i_x + 24); - __m512 y4 = _mm512_loadu_pd(data_y + i_y + 24); - __m512 diff4 = _mm512_sub_pd(x4, y4); - sums4 = _mm512_fmadd_pd(diff4, diff4, sums4); + __m512 x = _mm512_loadu_pd(data_x + i_x); + __m512 y = _mm512_loadu_pd(data_y + i_y); + __m512 differences = _mm512_sub_pd(x, y); + sums = _mm512_fmadd_pd(differences, differences, sums); } } if constexpr (std::is_same_v) - { - Float32 sum1 = _mm512_reduce_add_ps(sums1); - Float32 sum2 = _mm512_reduce_add_ps(sums2); - Float32 sum3 = _mm512_reduce_add_ps(sums3); - Float32 sum4 = _mm512_reduce_add_ps(sums4); - state.sum = sum1 + sum2 + sum3 + sum4; - } + state.sum = _mm512_reduce_add_ps(sums); else - { - Float64 sum1 = _mm512_reduce_add_pd(sums1); - Float64 sum2 = _mm512_reduce_add_pd(sums2); - Float64 sum3 = _mm512_reduce_add_pd(sums3); - Float64 sum4 = _mm512_reduce_add_pd(sums4); - state.sum = sum1 + sum2 + sum3 + sum4; - } + state.sum = _mm512_reduce_add_pd(sums); } #endif From df0c018a9be06e9ccbfb40460f29b155aa86b57f Mon 
Sep 17 00:00:00 2001 From: Hongbin Ma Date: Fri, 12 Jan 2024 16:09:09 +0800 Subject: [PATCH 0196/1081] support T64 for date32 type --- src/Compression/CompressionCodecT64.cpp | 6 +++++ .../00873_t64_codec_date.reference | 4 +++ .../0_stateless/00873_t64_codec_date.sql | 26 +++++++++++++++++++ 3 files changed, 36 insertions(+) create mode 100644 tests/queries/0_stateless/00873_t64_codec_date.reference create mode 100644 tests/queries/0_stateless/00873_t64_codec_date.sql diff --git a/src/Compression/CompressionCodecT64.cpp b/src/Compression/CompressionCodecT64.cpp index bf9a9414bc1..42c6a18aa77 100644 --- a/src/Compression/CompressionCodecT64.cpp +++ b/src/Compression/CompressionCodecT64.cpp @@ -91,6 +91,7 @@ enum class MagicNumber : uint8_t Decimal32 = 19, Decimal64 = 20, IPv4 = 21, + Date32 = 22, }; MagicNumber serializeTypeId(std::optional type_id) @@ -109,6 +110,7 @@ MagicNumber serializeTypeId(std::optional type_id) case TypeIndex::Int32: return MagicNumber::Int32; case TypeIndex::Int64: return MagicNumber::Int64; case TypeIndex::Date: return MagicNumber::Date; + case TypeIndex::Date32: return MagicNumber::Date32; case TypeIndex::DateTime: return MagicNumber::DateTime; case TypeIndex::DateTime64: return MagicNumber::DateTime64; case TypeIndex::Enum8: return MagicNumber::Enum8; @@ -137,6 +139,7 @@ TypeIndex deserializeTypeId(uint8_t serialized_type_id) case MagicNumber::Int32: return TypeIndex::Int32; case MagicNumber::Int64: return TypeIndex::Int64; case MagicNumber::Date: return TypeIndex::Date; + case MagicNumber::Date32: return TypeIndex::Date32; case MagicNumber::DateTime: return TypeIndex::DateTime; case MagicNumber::DateTime64: return TypeIndex::DateTime64; case MagicNumber::Enum8: return TypeIndex::Enum8; @@ -177,6 +180,8 @@ TypeIndex baseType(TypeIndex type_idx) case TypeIndex::Enum16: case TypeIndex::Date: return TypeIndex::UInt16; + case TypeIndex::Date32: + return TypeIndex::Int32; case TypeIndex::UInt32: case TypeIndex::DateTime: case TypeIndex::IPv4: @@ -205,6 +210,7 @@ TypeIndex typeIdx(const IDataType * data_type) case TypeIndex::UInt16: case TypeIndex::Enum16: case TypeIndex::Date: + case TypeIndex::Date32: case TypeIndex::Int32: case TypeIndex::UInt32: case TypeIndex::IPv4: diff --git a/tests/queries/0_stateless/00873_t64_codec_date.reference b/tests/queries/0_stateless/00873_t64_codec_date.reference new file mode 100644 index 00000000000..1568c3122e6 --- /dev/null +++ b/tests/queries/0_stateless/00873_t64_codec_date.reference @@ -0,0 +1,4 @@ +1970-01-01 1970-01-01 1950-01-01 1950-01-01 +1970-01-01 1970-01-01 1970-01-01 1970-01-01 +2149-06-06 2149-06-06 2149-06-08 2149-06-08 +2149-06-06 2149-06-06 2149-06-06 2149-06-06 diff --git a/tests/queries/0_stateless/00873_t64_codec_date.sql b/tests/queries/0_stateless/00873_t64_codec_date.sql new file mode 100644 index 00000000000..e9230c75665 --- /dev/null +++ b/tests/queries/0_stateless/00873_t64_codec_date.sql @@ -0,0 +1,26 @@ +DROP TABLE IF EXISTS t64; + +CREATE TABLE t64 +( + date16 Date, + t_date16 Date Codec(T64, ZSTD), + date_32 Date32, + t_date32 Date32 Codec(T64, ZSTD) +) ENGINE MergeTree() ORDER BY tuple(); + +INSERT INTO t64 values ('1970-01-01', '1970-01-01', '1970-01-01', '1970-01-01'); +INSERT INTO t64 values ('2149-06-06', '2149-06-06', '2149-06-06', '2149-06-06'); +INSERT INTO t64 values ('2149-06-08', '2149-06-08', '2149-06-08', '2149-06-08'); +INSERT INTO t64 values ('1950-01-01', '1950-01-01', '1950-01-01', '1950-01-01'); + +SELECT * FROM t64 ORDER BY date16; + +SELECT * FROM t64 WHERE date16 != t_date16; 
+SELECT * FROM t64 WHERE date_32 != t_date32; + +OPTIMIZE TABLE t64 FINAL; + +SELECT * FROM t64 WHERE date16 != t_date16; +SELECT * FROM t64 WHERE date_32 != t_date32; + +DROP TABLE t64; From b4dcd6755a8a2384e5937991e0656058aed4f95a Mon Sep 17 00:00:00 2001 From: avogar Date: Mon, 22 Jan 2024 13:41:58 +0000 Subject: [PATCH 0197/1081] Use ColumnConst instead of Field in IColumn::createWithOffsets --- src/Columns/ColumnConst.cpp | 22 +++++++++++++++++++ src/Columns/ColumnConst.h | 5 +++++ src/Columns/ColumnNullable.cpp | 16 ++++++-------- src/Columns/ColumnNullable.h | 2 +- src/Columns/ColumnObject.cpp | 3 ++- src/Columns/ColumnSparse.cpp | 3 ++- src/Columns/ColumnVector.cpp | 5 +++-- src/Columns/ColumnVector.h | 2 +- src/Columns/IColumn.cpp | 6 ++--- src/Columns/IColumn.h | 5 +++-- src/Functions/IFunction.cpp | 4 ++-- .../0_stateless/02941_variant_type_alters.sh | 1 + 12 files changed, 52 insertions(+), 22 deletions(-) diff --git a/src/Columns/ColumnConst.cpp b/src/Columns/ColumnConst.cpp index 9aa0f5cfa49..6e5a3c45c4e 100644 --- a/src/Columns/ColumnConst.cpp +++ b/src/Columns/ColumnConst.cpp @@ -159,4 +159,26 @@ void ColumnConst::compareColumn( std::fill(compare_results.begin(), compare_results.end(), res); } +ColumnConst::Ptr createColumnConst(const ColumnPtr & column, Field value) +{ + auto data = column->cloneEmpty(); + data->insert(value); + return ColumnConst::create(std::move(data), 1); +} + +ColumnConst::Ptr createColumnConst(const ColumnPtr & column, size_t const_value_index) +{ + auto data = column->cloneEmpty(); + data->insertFrom(*column, const_value_index); + return ColumnConst::create(std::move(data), 1); +} + +ColumnConst::Ptr createColumnConstWithDefaultValue(const ColumnPtr & column) +{ + auto data = column->cloneEmpty(); + data->insertDefault(); + return ColumnConst::create(std::move(data), 1); +} + + } diff --git a/src/Columns/ColumnConst.h b/src/Columns/ColumnConst.h index dc84e0c2402..3c646a62795 100644 --- a/src/Columns/ColumnConst.h +++ b/src/Columns/ColumnConst.h @@ -292,4 +292,9 @@ public: bool isCollationSupported() const override { return data->isCollationSupported(); } }; +ColumnConst::Ptr createColumnConst(const ColumnPtr & column, Field value); +ColumnConst::Ptr createColumnConst(const ColumnPtr & column, size_t const_value_index); +ColumnConst::Ptr createColumnConstWithDefaultValue(const ColumnPtr &column); + + } diff --git a/src/Columns/ColumnNullable.cpp b/src/Columns/ColumnNullable.cpp index 25b0e35e15e..c0b13204b8e 100644 --- a/src/Columns/ColumnNullable.cpp +++ b/src/Columns/ColumnNullable.cpp @@ -827,24 +827,22 @@ void ColumnNullable::checkConsistency() const "Logical error: Sizes of nested column and null map of Nullable column are not equal"); } -ColumnPtr ColumnNullable::createWithOffsets(const IColumn::Offsets & offsets, const Field & default_field, size_t total_rows, size_t shift) const +ColumnPtr ColumnNullable::createWithOffsets(const IColumn::Offsets & offsets, const ColumnConst & column_with_default_value, size_t total_rows, size_t shift) const { ColumnPtr new_values; ColumnPtr new_null_map; - if (default_field.getType() == Field::Types::Null) + const ColumnNullable & nullable_column_with_default_value = assert_cast(column_with_default_value.getDataColumn()); + if (nullable_column_with_default_value.isNullAt(0)) { - auto default_column = nested_column->cloneEmpty(); - default_column->insertDefault(); - /// Value in main column, when null map is 1 is implementation defined. So, take any value. 
- new_values = nested_column->createWithOffsets(offsets, (*default_column)[0], total_rows, shift); - new_null_map = null_map->createWithOffsets(offsets, Field(1u), total_rows, shift); + new_values = nested_column->createWithOffsets(offsets, *createColumnConstWithDefaultValue(nested_column), total_rows, shift); + new_null_map = null_map->createWithOffsets(offsets, *createColumnConst(null_map, Field(1u)), total_rows, shift); } else { - new_values = nested_column->createWithOffsets(offsets, default_field, total_rows, shift); - new_null_map = null_map->createWithOffsets(offsets, Field(0u), total_rows, shift); + new_values = nested_column->createWithOffsets(offsets, *ColumnConst::create(nullable_column_with_default_value.getNestedColumnPtr(), 1), total_rows, shift); + new_null_map = null_map->createWithOffsets(offsets, *createColumnConst(null_map, Field(0u)), total_rows, shift); } return ColumnNullable::create(new_values, new_null_map); diff --git a/src/Columns/ColumnNullable.h b/src/Columns/ColumnNullable.h index 60c7750f8fc..3e04ba8a180 100644 --- a/src/Columns/ColumnNullable.h +++ b/src/Columns/ColumnNullable.h @@ -167,7 +167,7 @@ public: getIndicesOfNonDefaultRowsImpl(indices, from, limit); } - ColumnPtr createWithOffsets(const Offsets & offsets, const Field & default_field, size_t total_rows, size_t shift) const override; + ColumnPtr createWithOffsets(const Offsets & offsets, const ColumnConst & column_with_default_value, size_t total_rows, size_t shift) const override; bool isNullable() const override { return true; } bool isFixedAndContiguous() const override { return false; } diff --git a/src/Columns/ColumnObject.cpp b/src/Columns/ColumnObject.cpp index f7176568a1b..0ec9c616bab 100644 --- a/src/Columns/ColumnObject.cpp +++ b/src/Columns/ColumnObject.cpp @@ -2,6 +2,7 @@ #include #include #include +#include #include #include #include @@ -475,7 +476,7 @@ void ColumnObject::Subcolumn::finalize() { auto values = part->index(*offsets, offsets->size()); values = castColumn({values, from_type, ""}, to_type); - part = values->createWithOffsets(offsets_data, to_type->getDefault(), part_size, /*shift=*/ 0); + part = values->createWithOffsets(offsets_data, *createColumnConstWithDefaultValue(result_column->getPtr()), part_size, /*shift=*/ 0); } } diff --git a/src/Columns/ColumnSparse.cpp b/src/Columns/ColumnSparse.cpp index 02e6e9e56b4..eeeec912ce8 100644 --- a/src/Columns/ColumnSparse.cpp +++ b/src/Columns/ColumnSparse.cpp @@ -1,6 +1,7 @@ #include #include #include +#include #include #include #include @@ -130,7 +131,7 @@ StringRef ColumnSparse::getDataAt(size_t n) const ColumnPtr ColumnSparse::convertToFullColumnIfSparse() const { - return values->createWithOffsets(getOffsetsData(), (*values)[0], _size, /*shift=*/ 1); + return values->createWithOffsets(getOffsetsData(), *createColumnConst(values, 0), _size, /*shift=*/ 1); } void ColumnSparse::insertSingleValue(const Inserter & inserter) diff --git a/src/Columns/ColumnVector.cpp b/src/Columns/ColumnVector.cpp index b1cf449dfde..3aadc530878 100644 --- a/src/Columns/ColumnVector.cpp +++ b/src/Columns/ColumnVector.cpp @@ -2,6 +2,7 @@ #include #include +#include #include #include #include @@ -940,7 +941,7 @@ ColumnPtr ColumnVector::compress() const } template -ColumnPtr ColumnVector::createWithOffsets(const IColumn::Offsets & offsets, const Field & default_field, size_t total_rows, size_t shift) const +ColumnPtr ColumnVector::createWithOffsets(const IColumn::Offsets & offsets, const ColumnConst & column_with_default_value, size_t total_rows, size_t 
shift) const { if (offsets.size() + shift != size()) throw Exception(ErrorCodes::LOGICAL_ERROR, @@ -949,7 +950,7 @@ ColumnPtr ColumnVector::createWithOffsets(const IColumn::Offsets & offsets, c auto res = this->create(); auto & res_data = res->getData(); - T default_value = static_cast(default_field.safeGet()); + T default_value = assert_cast &>(column_with_default_value.getDataColumn()).getElement(0); res_data.resize_fill(total_rows, default_value); for (size_t i = 0; i < offsets.size(); ++i) res_data[offsets[i]] = data[i + shift]; diff --git a/src/Columns/ColumnVector.h b/src/Columns/ColumnVector.h index fab2d5f06aa..652cc1f5ff9 100644 --- a/src/Columns/ColumnVector.h +++ b/src/Columns/ColumnVector.h @@ -379,7 +379,7 @@ public: return this->template getIndicesOfNonDefaultRowsImpl(indices, from, limit); } - ColumnPtr createWithOffsets(const IColumn::Offsets & offsets, const Field & default_field, size_t total_rows, size_t shift) const override; + ColumnPtr createWithOffsets(const IColumn::Offsets & offsets, const ColumnConst & column_with_default_value, size_t total_rows, size_t shift) const override; ColumnPtr compress() const override; diff --git a/src/Columns/IColumn.cpp b/src/Columns/IColumn.cpp index 82dc82e0bd9..d7f83b822d2 100644 --- a/src/Columns/IColumn.cpp +++ b/src/Columns/IColumn.cpp @@ -35,7 +35,7 @@ void IColumn::insertFrom(const IColumn & src, size_t n) insert(src[n]); } -ColumnPtr IColumn::createWithOffsets(const Offsets & offsets, const Field & default_field, size_t total_rows, size_t shift) const +ColumnPtr IColumn::createWithOffsets(const Offsets & offsets, const ColumnConst & column_with_default_value, size_t total_rows, size_t shift) const { if (offsets.size() + shift != size()) throw Exception(ErrorCodes::LOGICAL_ERROR, @@ -51,14 +51,14 @@ ColumnPtr IColumn::createWithOffsets(const Offsets & offsets, const Field & defa current_offset = offsets[i]; if (offsets_diff > 1) - res->insertMany(default_field, offsets_diff - 1); + res->insertManyFrom(column_with_default_value.getDataColumn(), 0, offsets_diff - 1); res->insertFrom(*this, i + shift); } ssize_t offsets_diff = static_cast(total_rows) - current_offset; if (offsets_diff > 1) - res->insertMany(default_field, offsets_diff - 1); + res->insertManyFrom(column_with_default_value.getDataColumn(), 0, offsets_diff - 1); return res; } diff --git a/src/Columns/IColumn.h b/src/Columns/IColumn.h index 3f866e6213d..1dcd3acdd19 100644 --- a/src/Columns/IColumn.h +++ b/src/Columns/IColumn.h @@ -34,6 +34,7 @@ class Arena; class ColumnGathererStream; class Field; class WeakHash32; +class ColumnConst; /* * Represents a set of equal ranges in previous column to perform sorting in current column. @@ -462,10 +463,10 @@ public: /// Returns column with @total_size elements. /// In result column values from current column are at positions from @offsets. - /// Other values are filled by @default_value. + /// Other values are filled by value from @column_with_default_value. /// @shift means how much rows to skip from the beginning of current column. /// Used to create full column from sparse. - [[nodiscard]] virtual Ptr createWithOffsets(const Offsets & offsets, const Field & default_field, size_t total_rows, size_t shift) const; + [[nodiscard]] virtual Ptr createWithOffsets(const Offsets & offsets, const ColumnConst & column_with_default_value, size_t total_rows, size_t shift) const; /// Compress column in memory to some representation that allows to decompress it back. 
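To make the changed createWithOffsets contract easier to follow, here is a minimal stand-in using plain vectors. It mirrors the logic of ColumnVector<T>::createWithOffsets above (resize-fill with the default value, then scatter the stored values by offsets); the function and parameter names are illustrative only and are not part of the IColumn interface.

#include <cstddef>
#include <cstdint>
#include <vector>

/// Expand a sparse representation into a full array of total_rows elements:
/// values[i + shift] lands at row offsets[i], every other row gets default_value.
template <typename T>
std::vector<T> createWithOffsetsSketch(
    const std::vector<T> & values,
    const std::vector<uint64_t> & offsets,
    const T & default_value,
    size_t total_rows,
    size_t shift)
{
    std::vector<T> result(total_rows, default_value);
    for (size_t i = 0; i < offsets.size(); ++i)
        result[offsets[i]] = values[i + shift];
    return result;
}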
/// Return itself if compression is not applicable for this column type. diff --git a/src/Functions/IFunction.cpp b/src/Functions/IFunction.cpp index a46f4d2a11d..d4c6b8f4ba6 100644 --- a/src/Functions/IFunction.cpp +++ b/src/Functions/IFunction.cpp @@ -313,7 +313,7 @@ ColumnPtr IExecutableFunction::execute(const ColumnsWithTypeAndName & arguments, { bool use_default_implementation_for_sparse_columns = useDefaultImplementationForSparseColumns(); /// DataTypeFunction does not support obtaining default (isDefaultAt()) - /// ColumnFunction does not support getting specific values + /// ColumnFunction does not support getting specific values. if (result_type->getTypeId() != TypeIndex::Function && use_default_implementation_for_sparse_columns) { size_t num_sparse_columns = 0; @@ -368,7 +368,7 @@ ColumnPtr IExecutableFunction::execute(const ColumnsWithTypeAndName & arguments, if (!result_type->canBeInsideSparseColumns() || !res->isDefaultAt(0) || res->getNumberOfDefaultRows() != 1) { const auto & offsets_data = assert_cast &>(*sparse_offsets).getData(); - return res->createWithOffsets(offsets_data, (*res)[0], input_rows_count, /*shift=*/ 1); + return res->createWithOffsets(offsets_data, *createColumnConst(res, 0), input_rows_count, /*shift=*/ 1); } return ColumnSparse::create(res, sparse_offsets, input_rows_count); diff --git a/tests/queries/0_stateless/02941_variant_type_alters.sh b/tests/queries/0_stateless/02941_variant_type_alters.sh index 7e2ecbd67aa..9b0d4febd65 100755 --- a/tests/queries/0_stateless/02941_variant_type_alters.sh +++ b/tests/queries/0_stateless/02941_variant_type_alters.sh @@ -1,4 +1,5 @@ #!/usr/bin/env bash +# Tags: long CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # reset --log_comment From 15e3a5b3961ac304a30ef211594f57bda3a2f584 Mon Sep 17 00:00:00 2001 From: kssenii Date: Mon, 22 Jan 2024 14:57:10 +0100 Subject: [PATCH 0198/1081] Try fix flaky test --- .../integration/test_broken_projections/test.py | 16 +++++++++++----- 1 file changed, 11 insertions(+), 5 deletions(-) diff --git a/tests/integration/test_broken_projections/test.py b/tests/integration/test_broken_projections/test.py index acf0160cf1b..87d910b9c77 100644 --- a/tests/integration/test_broken_projections/test.py +++ b/tests/integration/test_broken_projections/test.py @@ -28,10 +28,17 @@ def cluster(): cluster.shutdown() -def create_table(node, table, replica, data_prefix=""): +def create_table(node, table, replica, data_prefix="", aggressive_merge=True): if data_prefix == "": data_prefix = table + if aggressive_merge: + vertical_merge_algorithm_min_rows_to_activate = 1 + vertical_merge_algorithm_min_columns_to_activate = 1 + else: + vertical_merge_algorithm_min_rows_to_activate = 100000 + vertical_merge_algorithm_min_columns_to_activate = 100 + node.query( f""" DROP TABLE IF EXISTS {table} SYNC; @@ -56,9 +63,8 @@ def create_table(node, table, replica, data_prefix=""): SETTINGS min_bytes_for_wide_part = 0, max_parts_to_merge_at_once=3, enable_vertical_merge_algorithm=1, - vertical_merge_algorithm_min_rows_to_activate = 1, - vertical_merge_algorithm_min_columns_to_activate = 1, - vertical_merge_algorithm_min_columns_to_activate = 1, + vertical_merge_algorithm_min_rows_to_activate = {vertical_merge_algorithm_min_rows_to_activate}, + vertical_merge_algorithm_min_columns_to_activate = {vertical_merge_algorithm_min_columns_to_activate}, compress_primary_key=0; """ ) @@ -411,7 +417,7 @@ def test_broken_projections_in_backups(cluster): node = cluster.instances["node"] table_name = "test4" - 
create_table(node, table_name, 1) + create_table(node, table_name, 1, aggressive_merge=False) node.query("SYSTEM STOP MERGES") From 0606a772674fdecf08a9a904ef46293e8bba9acc Mon Sep 17 00:00:00 2001 From: mochi Date: Mon, 22 Jan 2024 22:02:50 +0800 Subject: [PATCH 0199/1081] Update src/Storages/MergeTree/MutateTask.cpp Co-authored-by: Dmitry Novik --- src/Storages/MergeTree/MutateTask.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index 8ed8b8bba4c..fccee6bd887 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -676,7 +676,7 @@ static NameToNameVector collectFilesForRenames( { const std::vector suffixes = {".idx2", ".idx", ".gin_dict", ".gin_post", ".gin_seg", ".gin_sid"}; - for (const auto& suffix : suffixes) + for (const auto & suffix : suffixes) { String filename = INDEX_FILE_PREFIX + command.column_name + suffix; From 2e7ce5b0e208c91874d44eb0c828a1e01544a387 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Mon, 22 Jan 2024 16:24:43 +0100 Subject: [PATCH 0200/1081] Updated settings ptr and fetching of client from Disk & ObjectStorage --- src/Backups/BackupIO_AzureBlobStorage.cpp | 32 ++++++++----------- src/Backups/BackupIO_AzureBlobStorage.h | 4 +-- .../AzureBlobStorage/AzureObjectStorage.h | 7 +++- .../Cached/CachedObjectStorage.h | 8 +++++ src/Disks/ObjectStorages/IObjectStorage.h | 13 ++++++++ .../copyAzureBlobStorageFile.cpp | 22 ++++++------- .../copyAzureBlobStorageFile.h | 4 +-- src/Storages/StorageAzureBlob.cpp | 2 +- 8 files changed, 57 insertions(+), 35 deletions(-) diff --git a/src/Backups/BackupIO_AzureBlobStorage.cpp b/src/Backups/BackupIO_AzureBlobStorage.cpp index 8c6c1040eec..fca324869ae 100644 --- a/src/Backups/BackupIO_AzureBlobStorage.cpp +++ b/src/Backups/BackupIO_AzureBlobStorage.cpp @@ -37,13 +37,12 @@ BackupReaderAzureBlobStorage::BackupReaderAzureBlobStorage( , configuration(configuration_) { auto client_ptr = StorageAzureBlob::createClient(configuration, /* is_read_only */ false); - settings = StorageAzureBlob::createSettingsAsSharedPtr(context_); - auto settings_as_unique_ptr = StorageAzureBlob::createSettings(context_); object_storage = std::make_unique("BackupReaderAzureBlobStorage", std::move(client_ptr), - std::move(settings_as_unique_ptr), + StorageAzureBlob::createSettings(context_), configuration_.container); - client = object_storage->getClient(); + client = object_storage->getAzureBlobStorageClient(); + settings = object_storage->getSettings(); } BackupReaderAzureBlobStorage::~BackupReaderAzureBlobStorage() = default; @@ -89,8 +88,8 @@ std::unique_ptr BackupReaderAzureBlobStorage::readFile(const key = file_name; } return std::make_unique( - client.get(), key, read_settings, settings->max_single_read_retries, - settings->max_single_download_retries); + client.get(), key, read_settings, settings.get()->max_single_read_retries, + settings.get()->max_single_download_retries); } void BackupReaderAzureBlobStorage::copyFileToDisk(const String & path_in_backup, size_t file_size, bool encrypted_in_backup, @@ -98,10 +97,8 @@ void BackupReaderAzureBlobStorage::copyFileToDisk(const String & path_in_backup, { LOG_INFO(&Poco::Logger::get("BackupReaderAzureBlobStorage"), "Enter copyFileToDisk"); - /// Use the native copy as a more optimal way to copy a file from AzureBlobStorage to AzureBlobStorage if it's possible. - /// We don't check for `has_throttling` here because the native copy almost doesn't use network. 
auto destination_data_source_description = destination_disk->getDataSourceDescription(); - if (destination_data_source_description.sameKind(data_source_description) + if ((destination_data_source_description.type == DataSourceType::AzureBlobStorage) && (destination_data_source_description.is_encrypted == encrypted_in_backup)) { LOG_TRACE(log, "Copying {} from AzureBlobStorage to disk {}", path_in_backup, destination_disk->getName()); @@ -115,7 +112,7 @@ void BackupReaderAzureBlobStorage::copyFileToDisk(const String & path_in_backup, copyAzureBlobStorageFile( client, - reinterpret_cast(destination_disk->getObjectStorage().get())->getClient(), + destination_disk->getObjectStorage()->getAzureBlobStorageClient(), configuration.container, fs::path(configuration.blob_path) / path_in_backup, 0, @@ -150,13 +147,12 @@ BackupWriterAzureBlobStorage::BackupWriterAzureBlobStorage( , configuration(configuration_) { auto client_ptr = StorageAzureBlob::createClient(configuration, /* is_read_only */ false); - settings = StorageAzureBlob::createSettingsAsSharedPtr(context_); - auto settings_as_unique_ptr = StorageAzureBlob::createSettings(context_); object_storage = std::make_unique("BackupWriterAzureBlobStorage", std::move(client_ptr), - std::move(settings_as_unique_ptr), + StorageAzureBlob::createSettings(context_), configuration_.container); - client = object_storage->getClient(); + client = object_storage->getAzureBlobStorageClient(); + settings = object_storage->getSettings(); } void BackupWriterAzureBlobStorage::copyFileFromDisk(const String & path_in_backup, DiskPtr src_disk, const String & src_path, @@ -172,7 +168,7 @@ void BackupWriterAzureBlobStorage::copyFileFromDisk(const String & path_in_backu { LOG_TRACE(log, "Copying file {} from disk {} to AzureBlobStorag", src_path, src_disk->getName()); copyAzureBlobStorageFile( - reinterpret_cast(src_disk->getObjectStorage().get())->getClient(), + src_disk->getObjectStorage()->getAzureBlobStorageClient(), client, /* src_container */ blob_path[1], /* src_path */ blob_path[0], @@ -267,8 +263,8 @@ std::unique_ptr BackupWriterAzureBlobStorage::readFile(const String } return std::make_unique( - client.get(), key, read_settings, settings->max_single_read_retries, - settings->max_single_download_retries); + client.get(), key, read_settings, settings.get()->max_single_read_retries, + settings.get()->max_single_download_retries); } std::unique_ptr BackupWriterAzureBlobStorage::writeFile(const String & file_name) @@ -285,7 +281,7 @@ std::unique_ptr BackupWriterAzureBlobStorage::writeFile(const Strin return std::make_unique( client.get(), key, - settings->max_single_part_upload_size, + settings.get()->max_single_part_upload_size, DBMS_DEFAULT_BUFFER_SIZE, write_settings); } diff --git a/src/Backups/BackupIO_AzureBlobStorage.h b/src/Backups/BackupIO_AzureBlobStorage.h index 12bf073cd08..87dc470cdb3 100644 --- a/src/Backups/BackupIO_AzureBlobStorage.h +++ b/src/Backups/BackupIO_AzureBlobStorage.h @@ -31,7 +31,7 @@ private: MultiVersion client; StorageAzureBlob::Configuration configuration; std::unique_ptr object_storage; - std::shared_ptr settings; + MultiVersion settings; }; class BackupWriterAzureBlobStorage : public BackupWriterDefault @@ -60,7 +60,7 @@ private: MultiVersion client; StorageAzureBlob::Configuration configuration; std::unique_ptr object_storage; - std::shared_ptr settings; + MultiVersion settings; }; } diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h index 
52d535054ff..a9d082539e6 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h @@ -139,7 +139,12 @@ public: bool isRemote() const override { return true; } - MultiVersion & getClient() { return client; } + MultiVersion & getSettings() { return settings; } + + MultiVersion & getAzureBlobStorageClient() override + { + return client; + } private: const String name; diff --git a/src/Disks/ObjectStorages/Cached/CachedObjectStorage.h b/src/Disks/ObjectStorages/Cached/CachedObjectStorage.h index 4c185db051d..6b0ff8be58a 100644 --- a/src/Disks/ObjectStorages/Cached/CachedObjectStorage.h +++ b/src/Disks/ObjectStorages/Cached/CachedObjectStorage.h @@ -3,6 +3,7 @@ #include #include #include +#include "config.h" namespace Poco { @@ -118,6 +119,13 @@ public: static bool canUseReadThroughCache(const ReadSettings & settings); +#if USE_AZURE_BLOB_STORAGE + MultiVersion & getAzureBlobStorageClient() override + { + return object_storage->getAzureBlobStorageClient(); + } +#endif + private: FileCache::Key getCacheKey(const std::string & path) const; diff --git a/src/Disks/ObjectStorages/IObjectStorage.h b/src/Disks/ObjectStorages/IObjectStorage.h index f405be72287..cf113586ddf 100644 --- a/src/Disks/ObjectStorages/IObjectStorage.h +++ b/src/Disks/ObjectStorages/IObjectStorage.h @@ -23,7 +23,12 @@ #include #include #include +#include "config.h" +#if USE_AZURE_BLOB_STORAGE +#include +#include +#endif namespace DB { @@ -212,6 +217,14 @@ public: virtual WriteSettings patchSettings(const WriteSettings & write_settings) const; +#if USE_AZURE_BLOB_STORAGE + virtual MultiVersion & getAzureBlobStorageClient() + { + throw Exception(ErrorCodes::NOT_IMPLEMENTED, "This function is only implemented for AzureBlobStorage"); + } +#endif + + private: mutable std::mutex throttlers_mutex; ThrottlerPtr remote_read_throttler; diff --git a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp index 272be914cc1..bb8702e9b41 100644 --- a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp +++ b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.cpp @@ -49,7 +49,7 @@ namespace size_t total_size_, const String & dest_container_, const String & dest_blob_, - std::shared_ptr settings_, + MultiVersion settings_, const std::optional> & object_metadata_, ThreadPoolCallbackRunner schedule_, bool for_disk_azure_blob_storage_, @@ -65,7 +65,7 @@ namespace , schedule(schedule_) , for_disk_azure_blob_storage(for_disk_azure_blob_storage_) , log(log_) - , max_single_part_upload_size(settings_->max_single_part_upload_size) + , max_single_part_upload_size(settings_.get()->max_single_part_upload_size) { } @@ -78,7 +78,7 @@ namespace size_t total_size; const String & dest_container; const String & dest_blob; - std::shared_ptr settings; + MultiVersion settings; const std::optional> & object_metadata; ThreadPoolCallbackRunner schedule; bool for_disk_azure_blob_storage; @@ -114,9 +114,9 @@ namespace if (!total_size) throw Exception(ErrorCodes::LOGICAL_ERROR, "Chosen multipart upload for an empty file. 
This must not happen"); - auto max_part_number = settings->max_part_number; - auto min_upload_part_size = settings->min_upload_part_size; - auto max_upload_part_size = settings->max_upload_part_size; + auto max_part_number = settings.get()->max_part_number; + auto min_upload_part_size = settings.get()->min_upload_part_size; + auto max_upload_part_size = settings.get()->max_upload_part_size; if (!max_part_number) throw Exception(ErrorCodes::INVALID_CONFIG_PARAMETER, "max_part_number must not be 0"); @@ -333,7 +333,7 @@ void copyDataToAzureBlobStorageFile( MultiVersion & dest_client, const String & dest_container, const String & dest_blob, - std::shared_ptr settings, + MultiVersion settings, const std::optional> & object_metadata, ThreadPoolCallbackRunner schedule, bool for_disk_azure_blob_storage) @@ -352,14 +352,14 @@ void copyAzureBlobStorageFile( size_t size, const String & dest_container, const String & dest_blob, - std::shared_ptr settings, + MultiVersion settings, const ReadSettings & read_settings, const std::optional> & object_metadata, ThreadPoolCallbackRunner schedule, bool for_disk_azure_blob_storage) { - if (settings->use_native_copy) + if (settings.get()->use_native_copy) { ProfileEvents::increment(ProfileEvents::AzureCopyObject); if (for_disk_azure_blob_storage) @@ -393,8 +393,8 @@ void copyAzureBlobStorageFile( LOG_TRACE(&Poco::Logger::get("copyAzureBlobStorageFile"), "Reading from Container: {}, Blob: {}", src_container, src_blob); auto create_read_buffer = [&] { - return std::make_unique(src_client.get(), src_blob, read_settings, settings->max_single_read_retries, - settings->max_single_download_retries); + return std::make_unique(src_client.get(), src_blob, read_settings, settings.get()->max_single_read_retries, + settings.get()->max_single_download_retries); }; UploadHelper helper{create_read_buffer, dest_client, offset, size, dest_container, dest_blob, settings, object_metadata, schedule, for_disk_azure_blob_storage, &Poco::Logger::get("copyAzureBlobStorageFile")}; diff --git a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h index b022151d32d..491f7cd7176 100644 --- a/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h +++ b/src/IO/AzureBlobStorage/copyAzureBlobStorageFile.h @@ -29,7 +29,7 @@ void copyAzureBlobStorageFile( size_t src_size, const String & dest_container, const String & dest_blob, - std::shared_ptr settings, + MultiVersion settings, const ReadSettings & read_settings, const std::optional> & object_metadata = std::nullopt, ThreadPoolCallbackRunner schedule_ = {}, @@ -48,7 +48,7 @@ void copyDataToAzureBlobStorageFile( MultiVersion & client, const String & dest_container, const String & dest_blob, - std::shared_ptr settings, + MultiVersion settings, const std::optional> & object_metadata = std::nullopt, ThreadPoolCallbackRunner schedule_ = {}, bool for_disk_azure_blob_storage = false); diff --git a/src/Storages/StorageAzureBlob.cpp b/src/Storages/StorageAzureBlob.cpp index 7a40d2dcb73..e54838c7a61 100644 --- a/src/Storages/StorageAzureBlob.cpp +++ b/src/Storages/StorageAzureBlob.cpp @@ -1214,7 +1214,7 @@ StorageAzureBlobSource::ReaderHolder StorageAzureBlobSource::createReader() QueryPipelineBuilder builder; std::shared_ptr source; std::unique_ptr read_buf; - std::optional num_rows_from_cache = need_only_count && getContext()->getSettingsRef().use_cache_for_count_from_files + std::optional num_rows_from_cache = need_only_count && getContext()->getSettingsRef().use_cache_for_count_from_files ? 
tryGetNumRowsFromCache(path_with_metadata) : std::nullopt; if (num_rows_from_cache) { From 4e5249275ed67c52d958007978c66619db22a1a5 Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Mon, 22 Jan 2024 16:45:25 +0100 Subject: [PATCH 0201/1081] Do not resolve remote table id on initiator --- src/Storages/StorageDistributed.cpp | 9 +-------- 1 file changed, 1 insertion(+), 8 deletions(-) diff --git a/src/Storages/StorageDistributed.cpp b/src/Storages/StorageDistributed.cpp index 987ea4a4957..9972517bbac 100644 --- a/src/Storages/StorageDistributed.cpp +++ b/src/Storages/StorageDistributed.cpp @@ -779,18 +779,11 @@ QueryTreeNodePtr buildQueryTreeDistributed(SelectQueryInfo & query_info, } else { - auto resolved_remote_storage_id = remote_storage_id; - // In case of cross-replication we don't know what database is used for the table. - // `storage_id.hasDatabase()` can return false only on the initiator node. - // Each shard will use the default database (in the case of cross-replication shards may have different defaults). - if (remote_storage_id.hasDatabase()) - resolved_remote_storage_id = query_context->resolveStorageID(remote_storage_id); - auto get_column_options = GetColumnsOptions(GetColumnsOptions::All).withExtendedObjects().withVirtuals(); auto column_names_and_types = distributed_storage_snapshot->getColumns(get_column_options); - auto storage = std::make_shared(resolved_remote_storage_id, ColumnsDescription{column_names_and_types}); + auto storage = std::make_shared(remote_storage_id, ColumnsDescription{column_names_and_types}); auto table_node = std::make_shared(std::move(storage), query_context); if (table_expression_modifiers) From 7b235fe643e744b643be6e4d0788de63cae4a07c Mon Sep 17 00:00:00 2001 From: Blargian Date: Mon, 22 Jan 2024 22:59:59 +0200 Subject: [PATCH 0202/1081] #31363 - remove schema delimiter setting and add test 00937_format_schema_rows_template.sh and reference --- src/Formats/FormatFactory.cpp | 1 - .../Impl/TemplateBlockOutputFormat.cpp | 15 +++------ ...0937_format_schema_rows_template.reference | 4 +++ .../00937_format_schema_rows_template.sh | 32 +++++++++++++++++++ 4 files changed, 40 insertions(+), 12 deletions(-) create mode 100644 tests/queries/0_stateless/00937_format_schema_rows_template.reference create mode 100755 tests/queries/0_stateless/00937_format_schema_rows_template.sh diff --git a/src/Formats/FormatFactory.cpp b/src/Formats/FormatFactory.cpp index 6f7f758621c..184778a9fa9 100644 --- a/src/Formats/FormatFactory.cpp +++ b/src/Formats/FormatFactory.cpp @@ -167,7 +167,6 @@ FormatSettings getFormatSettings(ContextPtr context, const Settings & settings) format_settings.template_settings.row_between_delimiter = settings.format_template_rows_between_delimiter; format_settings.template_settings.row_format = settings.format_template_row; format_settings.template_settings.row_format_schema = settings.format_schema_rows_template; - format_settings.template_settings.row_between_delimiter_schema = settings.format_schema_rows_between_delimiter; format_settings.tsv.crlf_end_of_line = settings.output_format_tsv_crlf_end_of_line; format_settings.tsv.empty_as_default = settings.input_format_tsv_empty_as_default; format_settings.tsv.enum_as_number = settings.input_format_tsv_enum_as_number; diff --git a/src/Processors/Formats/Impl/TemplateBlockOutputFormat.cpp b/src/Processors/Formats/Impl/TemplateBlockOutputFormat.cpp index 495cc0e541e..99a7f59c09e 100644 --- a/src/Processors/Formats/Impl/TemplateBlockOutputFormat.cpp +++ 
b/src/Processors/Formats/Impl/TemplateBlockOutputFormat.cpp @@ -221,21 +221,14 @@ void registerOutputFormatTemplate(FormatFactory & factory) }; if (settings.template_settings.row_format.empty()) { - if (settings.template_settings.row_format_schema.empty()) - { - throw Exception(DB::ErrorCodes::INVALID_TEMPLATE_FORMAT, "Expected either format_template_row or format_schema_rows_template"); - } - else - { - row_format = ParsedTemplateFormatString(); - row_format.parse(settings.template_settings.row_format_schema,idx_by_name); - } + row_format = ParsedTemplateFormatString(); + row_format.parse(settings.template_settings.row_format_schema,idx_by_name); } else { - if (settings.template_settings.row_format_schema.empty()) + if (!settings.template_settings.row_format_schema.empty()) { - throw Exception(DB::ErrorCodes::INVALID_TEMPLATE_FORMAT, "Expected either format_template_row or format_schema_rows_template"); + throw Exception(DB::ErrorCodes::INVALID_TEMPLATE_FORMAT, "Expected either format_template_row or format_schema_rows_template, but not both"); } row_format = ParsedTemplateFormatString( FormatSchemaInfo(settings.template_settings.row_format, "Template", false, diff --git a/tests/queries/0_stateless/00937_format_schema_rows_template.reference b/tests/queries/0_stateless/00937_format_schema_rows_template.reference new file mode 100644 index 00000000000..167f16ec55f --- /dev/null +++ b/tests/queries/0_stateless/00937_format_schema_rows_template.reference @@ -0,0 +1,4 @@ +Question: 'How awesome is clickhouse?', Answer: 'unbelievably awesome!', Number of Likes: 456, Date: 2016-01-02; +Question: 'How fast is clickhouse?', Answer: 'Lightning fast!', Number of Likes: 9876543210, Date: 2016-01-03; +Question: 'Is it opensource', Answer: 'of course it is!', Number of Likes: 789, Date: 2016-01-04 + diff --git a/tests/queries/0_stateless/00937_format_schema_rows_template.sh b/tests/queries/0_stateless/00937_format_schema_rows_template.sh new file mode 100755 index 00000000000..651e3618f83 --- /dev/null +++ b/tests/queries/0_stateless/00937_format_schema_rows_template.sh @@ -0,0 +1,32 @@ +#!/usr/bin/env bash +# shellcheck disable=SC2016 + +CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# shellcheck source=../shell_config.sh +. 
"$CURDIR"/../shell_config.sh + +# Test format_schema_rows_template setting + +$CLICKHOUSE_CLIENT --query="DROP TABLE IF EXISTS template"; +$CLICKHOUSE_CLIENT --query="CREATE TABLE template (question String, answer String, likes UInt64, date Date) ENGINE = Memory"; +$CLICKHOUSE_CLIENT --query="INSERT INTO template VALUES +('How awesome is clickhouse?', 'unbelievably awesome!', 456, '2016-01-02'),\ +('How fast is clickhouse?', 'Lightning fast!', 9876543210, '2016-01-03'),\ +('Is it opensource', 'of course it is!', 789, '2016-01-04')"; + +$CLICKHOUSE_CLIENT --query="SELECT * FROM template GROUP BY question, answer, likes, date WITH TOTALS ORDER BY date LIMIT 3 FORMAT Template SETTINGS \ +format_schema_rows_template = 'Question: \${question:Quoted}, Answer: \${answer:Quoted}, Number of Likes: \${likes:Raw}, Date: \${date:Raw}', \ +format_template_rows_between_delimiter = ';\n'"; + +echo -e "\n" + +# Test that if both format_schema_rows_template setting and format_template_row are provided, error is thrown + +echo -ne 'Question: ${question:Quoted}, Answer: ${answer:Quoted}, Number of Likes: ${likes:Raw}, Date: ${date:Raw}' > "$CURDIR"/00937_template_output_format_row.tmp +$CLICKHOUSE_CLIENT --query="SELECT * FROM template GROUP BY question, answer, likes, date WITH TOTALS ORDER BY date LIMIT 3 FORMAT Template SETTINGS \ +format_template_row = '$CURDIR/00937_template_output_format_row.tmp', \ +format_schema_rows_template = 'Question: \${question:Quoted}, Answer: \${answer:Quoted}, Number of Likes: \${likes:Raw}, Date: \${date:Raw}', \ +format_template_rows_between_delimiter = ';\n'"; -- { serverError 474 } + +$CLICKHOUSE_CLIENT --query="DROP TABLE template"; +rm "$CURDIR"/00937_template_output_format_row.tmp \ No newline at end of file From 3832a8261a19004e88a32b4bab39f6b46b14daa6 Mon Sep 17 00:00:00 2001 From: Blargian Date: Mon, 22 Jan 2024 23:20:02 +0200 Subject: [PATCH 0203/1081] #31363 - update documentation for En and Ru --- docs/en/interfaces/formats.md | 4 +++- docs/ru/interfaces/formats.md | 4 +++- 2 files changed, 6 insertions(+), 2 deletions(-) diff --git a/docs/en/interfaces/formats.md b/docs/en/interfaces/formats.md index a11c3e5ef19..fd44fbf4462 100644 --- a/docs/en/interfaces/formats.md +++ b/docs/en/interfaces/formats.md @@ -253,7 +253,7 @@ This format is also available under the name `TSVRawWithNamesAndNames`. This format allows specifying a custom format string with placeholders for values with a specified escaping rule. -It uses settings `format_template_resultset`, `format_template_row`, `format_template_rows_between_delimiter` and some settings of other formats (e.g. `output_format_json_quote_64bit_integers` when using `JSON` escaping, see further) +It uses settings `format_template_resultset`, `format_template_row` (`format_schema_rows_template`), `format_template_rows_between_delimiter` and some settings of other formats (e.g. 
`output_format_json_quote_64bit_integers` when using `JSON` escaping, see further) Setting `format_template_row` specifies the path to the file containing format strings for rows with the following syntax: @@ -279,6 +279,8 @@ the values of `SearchPhrase`, `c` and `price` columns, which are escaped as `Quo `Search phrase: 'bathroom interior design', count: 2166, ad price: $3;` +In cases where it is challenging or not possible to deploy format output configuration for the template format to a directory on all nodes in a cluster, or if the format is trivial, then `format_schema_rows_template` can be used to pass the template string directly in the query, rather than a path to the file which contains it. + The `format_template_rows_between_delimiter` setting specifies the delimiter between rows, which is printed (or expected) after every row except the last one (`\n` by default) Setting `format_template_resultset` specifies the path to the file, which contains a format string for resultset. Format string for resultset has the same syntax as a format string for row and allows to specify a prefix, a suffix and a way to print some additional information. It contains the following placeholders instead of column names: diff --git a/docs/ru/interfaces/formats.md b/docs/ru/interfaces/formats.md index b4794b02743..8f8197e2221 100644 --- a/docs/ru/interfaces/formats.md +++ b/docs/ru/interfaces/formats.md @@ -201,7 +201,7 @@ SELECT * FROM nestedt FORMAT TSV Этот формат позволяет указать произвольную форматную строку, в которую подставляются значения, сериализованные выбранным способом. -Для этого используются настройки `format_template_resultset`, `format_template_row`, `format_template_rows_between_delimiter` и настройки экранирования других форматов (например, `output_format_json_quote_64bit_integers` при экранировании как в `JSON`, см. далее) +Для этого используются настройки `format_template_resultset`, `format_template_row` (`format_schema_rows_template`), `format_template_rows_between_delimiter` и настройки экранирования других форматов (например, `output_format_json_quote_64bit_integers` при экранировании как в `JSON`, см. далее) Настройка `format_template_row` задаёт путь к файлу, содержащему форматную строку для строк таблицы, которая должна иметь вид: @@ -227,6 +227,8 @@ SELECT * FROM nestedt FORMAT TSV `Search phrase: 'bathroom interior design', count: 2166, ad price: $3;` +В тех случаях, когда неудобно или невозможно указать произвольную форматную строку в файле, можно использовать `format_schema_rows_template`, чтобы указать произвольную форматную строку прямо в запросе. + Настройка `format_template_rows_between_delimiter` задаёт разделитель между строками, который выводится (или ожмдается при вводе) после каждой строки, кроме последней. По умолчанию `\n`. Настройка `format_template_resultset` задаёт путь к файлу, содержащему форматную строку для результата. Форматная строка для результата имеет синтаксис аналогичный форматной строке для строк таблицы и позволяет указать префикс, суффикс и способ вывода дополнительной информации.
Вместо имён столбцов в ней указываются следующие имена подстановок: From c59f3e164ffedf1a7561b0fd0a65c2555685ca91 Mon Sep 17 00:00:00 2001 From: Bhavna Jindal Date: Thu, 18 Jan 2024 12:08:29 -0800 Subject: [PATCH 0204/1081] Return baseline component as fourth array --- .../sql-reference/functions/time-series-functions.md | 8 ++++++-- src/Functions/seriesDecomposeSTL.cpp | 10 +++++++++- .../0_stateless/02813_seriesDecomposeSTL.reference | 8 ++++---- 3 files changed, 19 insertions(+), 7 deletions(-) diff --git a/docs/en/sql-reference/functions/time-series-functions.md b/docs/en/sql-reference/functions/time-series-functions.md index 144d832b36a..2e42aa884b4 100644 --- a/docs/en/sql-reference/functions/time-series-functions.md +++ b/docs/en/sql-reference/functions/time-series-functions.md @@ -77,8 +77,8 @@ The number of data points in `series` should be at least twice the value of `per **Returned value** -- An array of three arrays where the first array include seasonal components, the second array - trend, -and the third array - residue component. +- An array of four arrays where the first array include seasonal components, the second array - trend, +the third array - residue component, and the fourth array - baseline component. Type: [Array](../../sql-reference/data-types/array.md). @@ -107,6 +107,10 @@ Result: [ 0, 0.0000019073486, -0.0000019073486, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, -0.0000019073486, 0, 0 + ], + [ + 10.1, 20.449999, 40.340004, 10.100001, 20.45, 40.34, 10.100001, 20.45, 40.34, 10.1, 20.45, 40.34, + 10.1, 20.45, 40.34, 10.1, 20.45, 40.34, 10.1, 20.45, 40.34, 10.100002, 20.45, 40.34 ]] │ └────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────┘ ``` diff --git a/src/Functions/seriesDecomposeSTL.cpp b/src/Functions/seriesDecomposeSTL.cpp index 21e36761213..0c44afa32a6 100644 --- a/src/Functions/seriesDecomposeSTL.cpp +++ b/src/Functions/seriesDecomposeSTL.cpp @@ -128,6 +128,10 @@ public: res_data.insert(residue.begin(), residue.end()); res_col_offsets_data.push_back(res_data.size()); + // Create Baseline = seasonal + trend + std::transform(seasonal.begin(), seasonal.end(), trend.begin(), std::back_inserter(res_data), std::plus()); + res_col_offsets_data.push_back(res_data.size()); + root_offsets_data.push_back(res_col_offsets->size()); prev_src_offset = curr_offset; @@ -201,7 +205,7 @@ The number of data points in `series` should be at least twice the value of `per **Returned value** -- An array of three arrays where the first array include seasonal components, the second array - trend, and the third array - residue component. +- An array of four arrays where the first array include seasonal components, the second array - trend, the third array - residue component, and the fourth array - baseline component. Type: [Array](../../sql-reference/data-types/array.md). 
@@ -230,6 +234,10 @@ Result: [ 0, 0.0000019073486, -0.0000019073486, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, -0.0000019073486, 0, 0 + ], + [ + 10.1, 20.449999, 40.340004, 10.100001, 20.45, 40.34, 10.100001, 20.45, 40.34, 10.1, 20.45, 40.34, + 10.1, 20.45, 40.34, 10.1, 20.45, 40.34, 10.1, 20.45, 40.34, 10.100002, 20.45, 40.34 ]] │ └────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────┘ ```)", diff --git a/tests/queries/0_stateless/02813_seriesDecomposeSTL.reference b/tests/queries/0_stateless/02813_seriesDecomposeSTL.reference index dc30e7f8371..28dae705335 100644 --- a/tests/queries/0_stateless/02813_seriesDecomposeSTL.reference +++ b/tests/queries/0_stateless/02813_seriesDecomposeSTL.reference @@ -1,4 +1,4 @@ -[[-13.529999,-3.1799996,16.71,-13.53,-3.1799996,16.71,-13.53,-3.1799996,16.71,-13.530001,-3.18,16.710001,-13.530001,-3.1800003,16.710001,-13.530001,-3.1800003,16.710001,-13.530001,-3.1799994,16.71,-13.529999,-3.1799994,16.709997],[23.63,23.63,23.630003,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.63,23.630001,23.630001,23.63,23.630001,23.630001,23.63,23.630001,23.630001,23.630001,23.630001,23.630001,23.630003],[0,0.0000019073486,-0.0000019073486,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,-0.0000019073486,0,0]] -[[4.04452e-8,-1.7846537e-8,-5.9488454e-9,0,0,0,0,0,0,-1.9868216e-8,-9.5297715e-8,2.2540547e-9,3.4229203e-8,8.573613e-8],[1.9999999,2,2,2,2,2,2,2,2,2,2,2,1.9999996,1.9999996],[1.1920929e-7,0,0,0,0,0,0,0,0,0,0,0,3.5762787e-7,2.3841858e-7]] -[[-13.529999,-3.1799996,16.71,-13.53,-3.1799996,16.71,-13.53,-3.1799996,16.71,-13.530001,-3.18,16.710001,-13.530001,-3.1800003,16.710001,-13.530001,-3.1800003,16.710001,-13.530001,-3.1799994,16.71,-13.529999,-3.1799994,16.709997],[23.63,23.63,23.630003,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.63,23.630001,23.630001,23.63,23.630001,23.630001,23.63,23.630001,23.630001,23.630001,23.630001,23.630001,23.630003],[0,0.0000019073486,-0.0000019073486,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,-0.0000019073486,0,0]] 
-[[53.946846,-4.8119445,43.525013,-23.71359,-42.472305,-51.636955,-50.458298,-51.982674,37.62072,-15.9006605,56.65076,-5.809669,57.143845,-2.0370207,54.050922,-4.897961,43.954018,-23.808758,-42.651337,-51.86827,-50.709732,-52.18156,37.734905,-15.853402,56.91643,-5.8815174,57.253094,-2.012879,54.157806,-4.9817176,44.384747,-23.902956,-42.830154,-52.10025,-50.96271,-52.3829,37.84573,-15.81032,57.177113,-5.958963,57.356136,-1.9952412,54.27533,-5.066312,44.878296,-23.956438,-42.993656,-52.337124,-51.208073,-52.615646,37.91102,-15.8062525,57.49891,-6.056076,57.45604,-1.9797823,54.39525,-5.1483474,45.374573],[88.028534,88.95315,89.87776,90.802376,91.64913,92.49588,93.342636,94.19737,95.0521,95.90684,96.712975,97.51912,98.32526,98.36342,98.40158,98.43974,98.36777,98.29579,98.223816,98.536446,98.849075,99.161705,99.7552,100.348694,100.94219,101.53184,102.12149,102.711136,103.79921,104.88729,105.975365,107.50462,109.033875,110.56313,111.79767,113.032196,114.26673,115.02128,115.775826,116.53037,117.15541,117.78044,118.40548,118.86489,119.3243,119.783714,120.04031,120.29691,120.55351,120.78621,121.01891,121.25161,121.533585,121.81555,122.09753,122.41821,122.7389,123.059586,123.39267],[-2.97538,2.8587952,-23.402771,0.91121674,4.8231735,9.141075,8.115662,10.785301,0.32717896,5.99382,-12.363731,5.29055,0.53089905,-2.3264008,-3.4524994,1.4582214,-2.321785,2.51297,5.4275208,3.3318253,5.8606567,0.019859314,-4.4901123,-12.495293,-5.8586197,-1.650322,-11.374588,4.3017426,4.042984,1.094429,9.639885,3.3983307,-3.20372,-5.462883,-5.834961,-6.649292,-1.1124649,3.7890396,16.047066,-2.5714111,8.488449,-2.785202,2.319191,-0.79857635,13.797401,-5.827278,-6.0466614,-5.9597855,-7.3454437,-3.1705627,6.0700684,3.5546417,1.9675064,-0.7594757,2.446434,0.5615692,0.86585236,-3.9112396,1.2327576]] +[[-13.529999,-3.1799996,16.71,-13.53,-3.1799996,16.71,-13.53,-3.1799996,16.71,-13.530001,-3.18,16.710001,-13.530001,-3.1800003,16.710001,-13.530001,-3.1800003,16.710001,-13.530001,-3.1799994,16.71,-13.529999,-3.1799994,16.709997],[23.63,23.63,23.630003,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.63,23.630001,23.630001,23.63,23.630001,23.630001,23.63,23.630001,23.630001,23.630001,23.630001,23.630001,23.630003],[0,0.0000019073486,-0.0000019073486,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,-0.0000019073486,0,0],[10.1,20.449999,40.340004,10.100001,20.45,40.34,10.100001,20.45,40.34,10.1,20.45,40.34,10.1,20.45,40.34,10.1,20.45,40.34,10.1,20.45,40.34,10.100002,20.45,40.34]] +[[4.04452e-8,-1.7846537e-8,-5.9488454e-9,0,0,0,0,0,0,-1.9868216e-8,-9.5297715e-8,2.2540547e-9,3.4229203e-8,8.573613e-8],[1.9999999,2,2,2,2,2,2,2,2,2,2,2,1.9999996,1.9999996],[1.1920929e-7,0,0,0,0,0,0,0,0,0,0,0,3.5762787e-7,2.3841858e-7],[1.9999999,2,2,2,2,2,2,2,2,2,1.9999999,2,1.9999996,1.9999998]] +[[-13.529999,-3.1799996,16.71,-13.53,-3.1799996,16.71,-13.53,-3.1799996,16.71,-13.530001,-3.18,16.710001,-13.530001,-3.1800003,16.710001,-13.530001,-3.1800003,16.710001,-13.530001,-3.1799994,16.71,-13.529999,-3.1799994,16.709997],[23.63,23.63,23.630003,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.630001,23.63,23.630001,23.630001,23.63,23.630001,23.630001,23.63,23.630001,23.630001,23.630001,23.630001,23.630001,23.630003],[0,0.0000019073486,-0.0000019073486,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,-0.0000019073486,0,0],[10.1,20.449999,40.340004,10.100001,20.45,40.34,10.100001,20.45,40.34,10.1,20.45,40.34,10.1,20.45,40.34,10.1,20.45,40.34,10.1,20.45,40.34,10.100002,20.45,40.34]] 
+[[53.946846,-4.8119445,43.525013,-23.71359,-42.472305,-51.636955,-50.458298,-51.982674,37.62072,-15.9006605,56.65076,-5.809669,57.143845,-2.0370207,54.050922,-4.897961,43.954018,-23.808758,-42.651337,-51.86827,-50.709732,-52.18156,37.734905,-15.853402,56.91643,-5.8815174,57.253094,-2.012879,54.157806,-4.9817176,44.384747,-23.902956,-42.830154,-52.10025,-50.96271,-52.3829,37.84573,-15.81032,57.177113,-5.958963,57.356136,-1.9952412,54.27533,-5.066312,44.878296,-23.956438,-42.993656,-52.337124,-51.208073,-52.615646,37.91102,-15.8062525,57.49891,-6.056076,57.45604,-1.9797823,54.39525,-5.1483474,45.374573],[88.028534,88.95315,89.87776,90.802376,91.64913,92.49588,93.342636,94.19737,95.0521,95.90684,96.712975,97.51912,98.32526,98.36342,98.40158,98.43974,98.36777,98.29579,98.223816,98.536446,98.849075,99.161705,99.7552,100.348694,100.94219,101.53184,102.12149,102.711136,103.79921,104.88729,105.975365,107.50462,109.033875,110.56313,111.79767,113.032196,114.26673,115.02128,115.775826,116.53037,117.15541,117.78044,118.40548,118.86489,119.3243,119.783714,120.04031,120.29691,120.55351,120.78621,121.01891,121.25161,121.533585,121.81555,122.09753,122.41821,122.7389,123.059586,123.39267],[-2.97538,2.8587952,-23.402771,0.91121674,4.8231735,9.141075,8.115662,10.785301,0.32717896,5.99382,-12.363731,5.29055,0.53089905,-2.3264008,-3.4524994,1.4582214,-2.321785,2.51297,5.4275208,3.3318253,5.8606567,0.019859314,-4.4901123,-12.495293,-5.8586197,-1.650322,-11.374588,4.3017426,4.042984,1.094429,9.639885,3.3983307,-3.20372,-5.462883,-5.834961,-6.649292,-1.1124649,3.7890396,16.047066,-2.5714111,8.488449,-2.785202,2.319191,-0.79857635,13.797401,-5.827278,-6.0466614,-5.9597855,-7.3454437,-3.1705627,6.0700684,3.5546417,1.9675064,-0.7594757,2.446434,0.5615692,0.86585236,-3.9112396,1.2327576],[141.97537,84.141205,133.40277,67.08878,49.176826,40.858925,42.88434,42.2147,132.67282,80.00618,153.36374,91.70945,155.4691,96.3264,152.4525,93.54178,142.32178,74.48703,55.57248,46.668175,48.139343,46.980145,137.49011,84.49529,157.85863,95.65032,159.37459,100.69826,157.95702,99.90557,150.3601,83.60167,66.20372,58.462883,60.834957,60.649296,152.11246,99.21096,172.95294,110.57141,174.51155,115.7852,172.68082,113.79858,164.2026,95.82728,77.04666,67.95979,69.34544,68.17056,158.92993,105.44536,179.0325,115.759476,179.55356,120.43843,177.13416,117.91124,168.76724]] From f935493f284e1acd94eacdf0c50f91de688d817e Mon Sep 17 00:00:00 2001 From: Bhavna Jindal Date: Fri, 19 Jan 2024 09:05:04 -0800 Subject: [PATCH 0205/1081] fix trailing whitespaces --- docs/en/sql-reference/functions/time-series-functions.md | 2 +- src/Functions/seriesDecomposeSTL.cpp | 4 ++-- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/docs/en/sql-reference/functions/time-series-functions.md b/docs/en/sql-reference/functions/time-series-functions.md index 2e42aa884b4..21e66302ad2 100644 --- a/docs/en/sql-reference/functions/time-series-functions.md +++ b/docs/en/sql-reference/functions/time-series-functions.md @@ -78,7 +78,7 @@ The number of data points in `series` should be at least twice the value of `per **Returned value** - An array of four arrays where the first array include seasonal components, the second array - trend, -the third array - residue component, and the fourth array - baseline component. +the third array - residue component, and the fourth array - baseline(seasoanl + trend) component. Type: [Array](../../sql-reference/data-types/array.md). 
diff --git a/src/Functions/seriesDecomposeSTL.cpp b/src/Functions/seriesDecomposeSTL.cpp index 0c44afa32a6..9a6a229e282 100644 --- a/src/Functions/seriesDecomposeSTL.cpp +++ b/src/Functions/seriesDecomposeSTL.cpp @@ -128,7 +128,7 @@ public: res_data.insert(residue.begin(), residue.end()); res_col_offsets_data.push_back(res_data.size()); - // Create Baseline = seasonal + trend + // Create Baseline = seasonal + trend std::transform(seasonal.begin(), seasonal.end(), trend.begin(), std::back_inserter(res_data), std::plus()); res_col_offsets_data.push_back(res_data.size()); @@ -205,7 +205,7 @@ The number of data points in `series` should be at least twice the value of `per **Returned value** -- An array of four arrays where the first array include seasonal components, the second array - trend, the third array - residue component, and the fourth array - baseline component. +- An array of four arrays where the first array include seasonal components, the second array - trend, the third array - residue component, and the fourth array - baseline(seasoanl + trend) component. Type: [Array](../../sql-reference/data-types/array.md). From d9edd5a7f36491a8d86705e6c7221c1a74cd6ef5 Mon Sep 17 00:00:00 2001 From: Bhavna Jindal Date: Fri, 19 Jan 2024 10:20:01 -0800 Subject: [PATCH 0206/1081] fix spell check --- docs/en/sql-reference/functions/time-series-functions.md | 2 +- src/Functions/seriesDecomposeSTL.cpp | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/docs/en/sql-reference/functions/time-series-functions.md b/docs/en/sql-reference/functions/time-series-functions.md index 21e66302ad2..016c3410944 100644 --- a/docs/en/sql-reference/functions/time-series-functions.md +++ b/docs/en/sql-reference/functions/time-series-functions.md @@ -78,7 +78,7 @@ The number of data points in `series` should be at least twice the value of `per **Returned value** - An array of four arrays where the first array include seasonal components, the second array - trend, -the third array - residue component, and the fourth array - baseline(seasoanl + trend) component. +the third array - residue component, and the fourth array - baseline(seasonal + trend) component. Type: [Array](../../sql-reference/data-types/array.md). diff --git a/src/Functions/seriesDecomposeSTL.cpp b/src/Functions/seriesDecomposeSTL.cpp index 9a6a229e282..4376691868b 100644 --- a/src/Functions/seriesDecomposeSTL.cpp +++ b/src/Functions/seriesDecomposeSTL.cpp @@ -205,7 +205,7 @@ The number of data points in `series` should be at least twice the value of `per **Returned value** -- An array of four arrays where the first array include seasonal components, the second array - trend, the third array - residue component, and the fourth array - baseline(seasoanl + trend) component. +- An array of four arrays where the first array include seasonal components, the second array - trend, the third array - residue component, and the fourth array - baseline(seasonal + trend) component. Type: [Array](../../sql-reference/data-types/array.md). 
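As a usage sketch (not part of the patch itself), the query below feeds a repeating period-3 series, consistent with the documented output above, into `seriesDecomposeSTL` and reads the new fourth array; per the `std::transform` line added to `seriesDecomposeSTL.cpp`, the baseline is expected to equal the element-wise sum of the seasonal and trend arrays.

```sql
-- Sketch only: decompose a period-3 series and compare the new fourth
-- (baseline) array against seasonal + trend computed with arrayMap.
WITH
    seriesDecomposeSTL(
        [10.1, 20.45, 40.34, 10.1, 20.45, 40.34, 10.1, 20.45, 40.34, 10.1, 20.45, 40.34,
         10.1, 20.45, 40.34, 10.1, 20.45, 40.34, 10.1, 20.45, 40.34, 10.1, 20.45, 40.34],
        3) AS decomposed
SELECT
    decomposed[1] AS seasonal,
    decomposed[2] AS trend,
    decomposed[4] AS baseline,
    arrayMap((s, t) -> s + t, decomposed[1], decomposed[2]) AS seasonal_plus_trend;
```

Up to floating-point rounding, `baseline` and `seasonal_plus_trend` should match.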
From 084ee74b6898214024feafcfa292ff8419bc0050 Mon Sep 17 00:00:00 2001 From: Bhavna Jindal Date: Mon, 22 Jan 2024 07:31:33 -0800 Subject: [PATCH 0207/1081] minor fix --- src/Functions/seriesDecomposeSTL.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Functions/seriesDecomposeSTL.cpp b/src/Functions/seriesDecomposeSTL.cpp index 4376691868b..e9276c4aefb 100644 --- a/src/Functions/seriesDecomposeSTL.cpp +++ b/src/Functions/seriesDecomposeSTL.cpp @@ -129,7 +129,7 @@ public: res_col_offsets_data.push_back(res_data.size()); // Create Baseline = seasonal + trend - std::transform(seasonal.begin(), seasonal.end(), trend.begin(), std::back_inserter(res_data), std::plus()); + std::transform(seasonal.begin(), seasonal.end(), trend.begin(), std::back_inserter(res_data), std::plus<>()); res_col_offsets_data.push_back(res_data.size()); root_offsets_data.push_back(res_col_offsets->size()); From e78eb41264ebb37d3fd813850a3e55ce7690ecea Mon Sep 17 00:00:00 2001 From: MyroTk <44327070+MyroTk@users.noreply.github.com> Date: Mon, 22 Jan 2024 15:19:31 -0800 Subject: [PATCH 0208/1081] Update Dockerfile --- docker/test/integration/runner/Dockerfile | 57 +++++++++++------------ 1 file changed, 28 insertions(+), 29 deletions(-) diff --git a/docker/test/integration/runner/Dockerfile b/docker/test/integration/runner/Dockerfile index 2a81db78a3d..dbf90f9b810 100644 --- a/docker/test/integration/runner/Dockerfile +++ b/docker/test/integration/runner/Dockerfile @@ -63,47 +63,46 @@ RUN curl -fsSL https://download.docker.com/linux/ubuntu/gpg | apt-key add - \ RUN python3 -m pip install --no-cache-dir \ - PyMySQL \ - aerospike==11.1.0 \ - asyncio \ + PyMySQL==1.1.0 \ + asyncio==3.4.3 \ avro==1.10.2 \ - azure-storage-blob \ - boto3 \ - cassandra-driver \ + azure-storage-blob==12.19.0 \ + boto3==1.34.24 \ + cassandra-driver==3.29.0 \ confluent-kafka==1.9.2 \ delta-spark==2.3.0 \ - dict2xml \ - dicttoxml \ + dict2xml==1.7.4 \ + dicttoxml==1.7.16 \ docker==6.1.3 \ docker-compose==1.29.2 \ - grpcio \ - grpcio-tools \ - kafka-python \ - kazoo \ - lz4 \ - minio \ - nats-py \ - protobuf \ + grpcio==1.60.0 \ + grpcio-tools==1.60.0 \ + kafka-python==2.0.2 \ + kazoo==2.9.0 \ + lz4==4.3.3 \ + minio==7.2.3 \ + nats-py==2.6.0 \ + protobuf==4.25.2 \ psycopg2-binary==2.9.6 \ - pyhdfs \ + pyhdfs==0.3.1 \ pymongo==3.11.0 \ pyspark==3.3.2 \ - pytest \ + pytest==7.4.4 \ pytest-order==1.0.0 \ - pytest-random \ - pytest-repeat \ - pytest-timeout \ - pytest-xdist \ + pytest-random==0.2 \ + pytest-repeat==0.9.3 \ + pytest-timeout==2.2.0 \ + pytest-xdist==3.5.0 \ pytest-reportlog==0.4.0 \ - pytz \ + pytz==2023.3.post1 \ pyyaml==5.3.1 \ - redis \ - requests-kerberos \ + redis==5.0.1 \ + requests-kerberos==0.14.0 \ tzlocal==2.1 \ - retry \ - bs4 \ - lxml \ - urllib3 + retry==0.9.2 \ + bs4==0.0.2 \ + lxml==5.1.0 \ + urllib3==2.0.7 # bs4, lxml are for cloud tests, do not delete # Hudi supports only spark 3.3.*, not 3.4 From 276ccd3d47be40b79abbaf7734f557d578501b19 Mon Sep 17 00:00:00 2001 From: Blargian Date: Tue, 23 Jan 2024 07:18:14 +0200 Subject: [PATCH 0209/1081] empty commit to restart CI checks From 78df07199bc57c8dac9a56fb8092eb1256ad8b56 Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Tue, 23 Jan 2024 07:16:38 +0000 Subject: [PATCH 0210/1081] More consistent tests for inverted index --- ...> 02346_inverted_index_bug47393.reference} | 0 .../02346_inverted_index_bug47393.sql | 25 +++++++++++++++++++ ...> 02346_inverted_index_bug52019.reference} | 0 ....sql => 02346_inverted_index_bug52019.sql} | 17 ++++++++++--- 
...46_inverted_index_detach_attach.reference} | 0 ...=> 02346_inverted_index_detach_attach.sql} | 6 ++--- ...nverted_index_experimental_flag.reference} | 0 ...2346_inverted_index_experimental_flag.sql} | 3 +++ ..._inverted_index_match_predicate.reference} | 0 ... 02346_inverted_index_match_predicate.sql} | 2 ++ .../02346_inverted_index_mutation.sql | 25 ------------------- ... => 02346_inverted_index_search.reference} | 0 ...ch.sql => 02346_inverted_index_search.sql} | 0 13 files changed, 47 insertions(+), 31 deletions(-) rename tests/queries/0_stateless/{02346_inverted_index_mutation.reference => 02346_inverted_index_bug47393.reference} (100%) create mode 100644 tests/queries/0_stateless/02346_inverted_index_bug47393.sql rename tests/queries/0_stateless/{02696_inverted_idx_checksums.reference => 02346_inverted_index_bug52019.reference} (100%) rename tests/queries/0_stateless/{02862_index_inverted_incorrect_args.sql => 02346_inverted_index_bug52019.sql} (62%) rename tests/queries/0_stateless/{02862_index_inverted_incorrect_args.reference => 02346_inverted_index_detach_attach.reference} (100%) rename tests/queries/0_stateless/{02696_inverted_idx_checksums.sql => 02346_inverted_index_detach_attach.sql} (75%) rename tests/queries/0_stateless/{02895_forbid_create_inverted_index.reference => 02346_inverted_index_experimental_flag.reference} (100%) rename tests/queries/0_stateless/{02895_forbid_create_inverted_index.sql => 02346_inverted_index_experimental_flag.sql} (72%) rename tests/queries/0_stateless/{02951_inverted_index_support_match.reference => 02346_inverted_index_match_predicate.reference} (100%) rename tests/queries/0_stateless/{02951_inverted_index_support_match.sql => 02346_inverted_index_match_predicate.sql} (97%) delete mode 100644 tests/queries/0_stateless/02346_inverted_index_mutation.sql rename tests/queries/0_stateless/{02346_full_text_search.reference => 02346_inverted_index_search.reference} (100%) rename tests/queries/0_stateless/{02346_full_text_search.sql => 02346_inverted_index_search.sql} (100%) diff --git a/tests/queries/0_stateless/02346_inverted_index_mutation.reference b/tests/queries/0_stateless/02346_inverted_index_bug47393.reference similarity index 100% rename from tests/queries/0_stateless/02346_inverted_index_mutation.reference rename to tests/queries/0_stateless/02346_inverted_index_bug47393.reference diff --git a/tests/queries/0_stateless/02346_inverted_index_bug47393.sql b/tests/queries/0_stateless/02346_inverted_index_bug47393.sql new file mode 100644 index 00000000000..166e051b120 --- /dev/null +++ b/tests/queries/0_stateless/02346_inverted_index_bug47393.sql @@ -0,0 +1,25 @@ +SET allow_experimental_inverted_index = 1; + +DROP TABLE IF EXISTS tab; +CREATE TABLE tab +( + id UInt64, + str String, + INDEX idx str TYPE inverted(3) GRANULARITY 1 +) +ENGINE = MergeTree +ORDER BY tuple() +SETTINGS min_rows_for_wide_part = 1, min_bytes_for_wide_part = 1; + +INSERT INTO tab (str) VALUES ('I am inverted'); + +SELECT data_version FROM system.parts WHERE database = currentDatabase() AND table = 'tab' AND active = 1; + +-- update column synchronously +ALTER TABLE tab UPDATE str = 'I am not inverted' WHERE 1 SETTINGS mutations_sync=1; + +SELECT data_version FROM system.parts WHERE database = currentDatabase() AND table = 'tab' AND active = 1; + +SELECT str FROM tab WHERE str LIKE '%inverted%' SETTINGS force_data_skipping_indices = 'idx'; + +DROP TABLE tab; diff --git a/tests/queries/0_stateless/02696_inverted_idx_checksums.reference 
b/tests/queries/0_stateless/02346_inverted_index_bug52019.reference similarity index 100% rename from tests/queries/0_stateless/02696_inverted_idx_checksums.reference rename to tests/queries/0_stateless/02346_inverted_index_bug52019.reference diff --git a/tests/queries/0_stateless/02862_index_inverted_incorrect_args.sql b/tests/queries/0_stateless/02346_inverted_index_bug52019.sql similarity index 62% rename from tests/queries/0_stateless/02862_index_inverted_incorrect_args.sql rename to tests/queries/0_stateless/02346_inverted_index_bug52019.sql index 7ba122a7155..c61e17d9cea 100644 --- a/tests/queries/0_stateless/02862_index_inverted_incorrect_args.sql +++ b/tests/queries/0_stateless/02346_inverted_index_bug52019.sql @@ -1,9 +1,20 @@ --- https://github.com/ClickHouse/ClickHouse/issues/52019 -DROP TABLE IF EXISTS tab; +-- Test for Bug 52019: Undefined behavior + SET allow_experimental_inverted_index=1; -CREATE TABLE tab (`k` UInt64, `s` Map(String, String), INDEX af mapKeys(s) TYPE inverted(2) GRANULARITY 1) ENGINE = MergeTree ORDER BY k SETTINGS index_granularity = 2, index_granularity_bytes = '10Mi'; + +DROP TABLE IF EXISTS tab; + +CREATE TABLE tab ( + k UInt64, + s Map(String, String), + INDEX idx mapKeys(s) TYPE inverted(2) GRANULARITY 1) +ENGINE = MergeTree +ORDER BY k +SETTINGS index_granularity = 2, index_granularity_bytes = '10Mi'; + INSERT INTO tab (k) VALUES (0); SELECT * FROM tab PREWHERE (s[NULL]) = 'Click a03' SETTINGS allow_experimental_analyzer=1; SELECT * FROM tab PREWHERE (s[1]) = 'Click a03' SETTINGS allow_experimental_analyzer=1; -- { serverError ILLEGAL_TYPE_OF_ARGUMENT } SELECT * FROM tab PREWHERE (s['foo']) = 'Click a03' SETTINGS allow_experimental_analyzer=1; + DROP TABLE tab; diff --git a/tests/queries/0_stateless/02862_index_inverted_incorrect_args.reference b/tests/queries/0_stateless/02346_inverted_index_detach_attach.reference similarity index 100% rename from tests/queries/0_stateless/02862_index_inverted_incorrect_args.reference rename to tests/queries/0_stateless/02346_inverted_index_detach_attach.reference diff --git a/tests/queries/0_stateless/02696_inverted_idx_checksums.sql b/tests/queries/0_stateless/02346_inverted_index_detach_attach.sql similarity index 75% rename from tests/queries/0_stateless/02696_inverted_idx_checksums.sql rename to tests/queries/0_stateless/02346_inverted_index_detach_attach.sql index 92ffa7a6196..762d78922fe 100644 --- a/tests/queries/0_stateless/02696_inverted_idx_checksums.sql +++ b/tests/queries/0_stateless/02346_inverted_index_detach_attach.sql @@ -2,8 +2,8 @@ SET allow_experimental_inverted_index = 1; CREATE TABLE t ( - `key` UInt64, - `str` String, + key UInt64, + str String, INDEX inv_idx str TYPE inverted(0) GRANULARITY 1 ) ENGINE = MergeTree @@ -13,4 +13,4 @@ INSERT INTO t VALUES (1, 'Hello World'); ALTER TABLE t DETACH PART 'all_1_1_0'; -ALTER TABLE t ATTACH PART 'all_1_1_0'; \ No newline at end of file +ALTER TABLE t ATTACH PART 'all_1_1_0'; diff --git a/tests/queries/0_stateless/02895_forbid_create_inverted_index.reference b/tests/queries/0_stateless/02346_inverted_index_experimental_flag.reference similarity index 100% rename from tests/queries/0_stateless/02895_forbid_create_inverted_index.reference rename to tests/queries/0_stateless/02346_inverted_index_experimental_flag.reference diff --git a/tests/queries/0_stateless/02895_forbid_create_inverted_index.sql b/tests/queries/0_stateless/02346_inverted_index_experimental_flag.sql similarity index 72% rename from 
tests/queries/0_stateless/02895_forbid_create_inverted_index.sql rename to tests/queries/0_stateless/02346_inverted_index_experimental_flag.sql index dc92d9198fb..bf89265372e 100644 --- a/tests/queries/0_stateless/02895_forbid_create_inverted_index.sql +++ b/tests/queries/0_stateless/02346_inverted_index_experimental_flag.sql @@ -1,4 +1,7 @@ +-- Tests that the inverted index can only be supported when allow_experimental_inverted_index = 1. + SET allow_experimental_inverted_index = 0; + DROP TABLE IF EXISTS tab; CREATE TABLE tab ( diff --git a/tests/queries/0_stateless/02951_inverted_index_support_match.reference b/tests/queries/0_stateless/02346_inverted_index_match_predicate.reference similarity index 100% rename from tests/queries/0_stateless/02951_inverted_index_support_match.reference rename to tests/queries/0_stateless/02346_inverted_index_match_predicate.reference diff --git a/tests/queries/0_stateless/02951_inverted_index_support_match.sql b/tests/queries/0_stateless/02346_inverted_index_match_predicate.sql similarity index 97% rename from tests/queries/0_stateless/02951_inverted_index_support_match.sql rename to tests/queries/0_stateless/02346_inverted_index_match_predicate.sql index 9ebf10412d9..99405c0acf2 100644 --- a/tests/queries/0_stateless/02951_inverted_index_support_match.sql +++ b/tests/queries/0_stateless/02346_inverted_index_match_predicate.sql @@ -1,3 +1,5 @@ +-- Tests that match() utilizes the inverted index + SET allow_experimental_inverted_index = true; DROP TABLE IF EXISTS tab; diff --git a/tests/queries/0_stateless/02346_inverted_index_mutation.sql b/tests/queries/0_stateless/02346_inverted_index_mutation.sql deleted file mode 100644 index 83b73807cd7..00000000000 --- a/tests/queries/0_stateless/02346_inverted_index_mutation.sql +++ /dev/null @@ -1,25 +0,0 @@ -SET allow_experimental_inverted_index=1; - -DROP TABLE IF EXISTS t; -CREATE TABLE t -( - `timestamp` UInt64, - `s` String, - INDEX idx s TYPE inverted(3) GRANULARITY 1 -) -ENGINE = MergeTree -ORDER BY tuple() -SETTINGS min_rows_for_wide_part = 1, min_bytes_for_wide_part = 1; - -INSERT INTO t (s) VALUES ('I am inverted'); - -SELECT data_version FROM system.parts WHERE database=currentDatabase() AND table='t' AND active=1; - --- do update column synchronously -ALTER TABLE t UPDATE s='I am not inverted' WHERE 1 SETTINGS mutations_sync=1; - -SELECT data_version FROM system.parts WHERE database=currentDatabase() AND table='t' AND active=1; - -SELECT s FROM t WHERE s LIKE '%inverted%' SETTINGS force_data_skipping_indices='idx'; - -DROP TABLE t; diff --git a/tests/queries/0_stateless/02346_full_text_search.reference b/tests/queries/0_stateless/02346_inverted_index_search.reference similarity index 100% rename from tests/queries/0_stateless/02346_full_text_search.reference rename to tests/queries/0_stateless/02346_inverted_index_search.reference diff --git a/tests/queries/0_stateless/02346_full_text_search.sql b/tests/queries/0_stateless/02346_inverted_index_search.sql similarity index 100% rename from tests/queries/0_stateless/02346_full_text_search.sql rename to tests/queries/0_stateless/02346_inverted_index_search.sql From bfec324b2818a3764c09347508125051273dac25 Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Tue, 23 Jan 2024 10:06:25 +0000 Subject: [PATCH 0211/1081] Some fixups + test --- src/Storages/MergeTree/MutateTask.cpp | 18 ++++++++++------- .../02346_inverted_index_bug59039.reference | 0 .../02346_inverted_index_bug59039.sql | 20 +++++++++++++++++++ 3 files changed, 31 insertions(+), 7 deletions(-) 
create mode 100644 tests/queries/0_stateless/02346_inverted_index_bug59039.reference create mode 100644 tests/queries/0_stateless/02346_inverted_index_bug59039.sql diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index fccee6bd887..48aad368dd4 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -674,21 +674,25 @@ static NameToNameVector collectFilesForRenames( { if (command.type == MutationCommand::Type::DROP_INDEX) { - const std::vector suffixes = {".idx2", ".idx", ".gin_dict", ".gin_post", ".gin_seg", ".gin_sid"}; + static const std::array suffixes = {".idx2", ".idx"}; + static const std::array gin_suffixes = {".gin_dict", ".gin_post", ".gin_seg", ".gin_sid"}; /// .gin_* is inverted index for (const auto & suffix : suffixes) { - String filename = INDEX_FILE_PREFIX + command.column_name + suffix; + const String filename = INDEX_FILE_PREFIX + command.column_name + suffix; + const String filename_mrk = INDEX_FILE_PREFIX + command.column_name + mrk_extension; - if ((suffix == ".idx2" || suffix == ".idx") && source_part->checksums.has(filename)) + if (source_part->checksums.has(filename)) { add_rename(filename, ""); - add_rename(INDEX_FILE_PREFIX + command.column_name + mrk_extension, ""); + add_rename(filename_mrk, ""); } - else if (source_part->checksums.has(filename)) - { + } + for (const auto & gin_suffix : gin_suffixes) + { + const String filename = INDEX_FILE_PREFIX + command.column_name + gin_suffix; + if (source_part->checksums.has(filename)) add_rename(filename, ""); - } } } else if (command.type == MutationCommand::Type::DROP_PROJECTION) diff --git a/tests/queries/0_stateless/02346_inverted_index_bug59039.reference b/tests/queries/0_stateless/02346_inverted_index_bug59039.reference new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/queries/0_stateless/02346_inverted_index_bug59039.sql b/tests/queries/0_stateless/02346_inverted_index_bug59039.sql new file mode 100644 index 00000000000..0ef0cb0c733 --- /dev/null +++ b/tests/queries/0_stateless/02346_inverted_index_bug59039.sql @@ -0,0 +1,20 @@ +-- This is supposed to test that DROP INDEX removes all index related files. Can't test this directly but at least run the statement and +-- check that no bad things happen. 
+ +SET allow_experimental_inverted_index = 1; + +DROP TABLE IF EXISTS tab; + +CREATE TABLE tab +( + id UInt64, + doc String, + INDEX text_idx doc TYPE inverted +) +ENGINE = MergeTree +ORDER BY id +SETTINGS index_granularity = 2, index_granularity_bytes = '10Mi', min_bytes_for_wide_part = 0, min_rows_for_wide_part = 0; + +ALTER TABLE tab DROP INDEX text_idx; + +DROP TABLE tab; From 992d859e726895dadc9fbab1ebf99acd4b29881c Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Tue, 23 Jan 2024 14:16:14 +0100 Subject: [PATCH 0212/1081] Fix style check --- src/Disks/ObjectStorages/IObjectStorage.h | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/src/Disks/ObjectStorages/IObjectStorage.h b/src/Disks/ObjectStorages/IObjectStorage.h index cf113586ddf..b7db353fb6a 100644 --- a/src/Disks/ObjectStorages/IObjectStorage.h +++ b/src/Disks/ObjectStorages/IObjectStorage.h @@ -23,6 +23,7 @@ #include #include #include +#include #include "config.h" #if USE_AZURE_BLOB_STORAGE @@ -33,6 +34,11 @@ namespace DB { +namespace ErrorCodes +{ + extern const int NOT_IMPLEMENTED; +} + class ReadBufferFromFileBase; class WriteBufferFromFileBase; From bef0fcb482c4b8782a1d2e485be9f6d8ffc2dfe9 Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Tue, 23 Jan 2024 14:56:24 +0100 Subject: [PATCH 0213/1081] Fix is_order_by_all flag in QueryNode --- src/Analyzer/QueryNode.cpp | 28 +++++++++++++++++----------- 1 file changed, 17 insertions(+), 11 deletions(-) diff --git a/src/Analyzer/QueryNode.cpp b/src/Analyzer/QueryNode.cpp index 738b1ac62e8..a82fb4489b5 100644 --- a/src/Analyzer/QueryNode.cpp +++ b/src/Analyzer/QueryNode.cpp @@ -119,6 +119,9 @@ void QueryNode::dumpTreeImpl(WriteBuffer & buffer, FormatState & format_state, s if (is_group_by_all) buffer << ", is_group_by_all: " << is_group_by_all; + if (is_order_by_all) + buffer << ", is_order_by_all: " << is_order_by_all; + std::string group_by_type; if (is_group_by_with_rollup) group_by_type = "rollup"; @@ -257,6 +260,7 @@ bool QueryNode::isEqualImpl(const IQueryTreeNode & rhs) const is_group_by_with_cube == rhs_typed.is_group_by_with_cube && is_group_by_with_grouping_sets == rhs_typed.is_group_by_with_grouping_sets && is_group_by_all == rhs_typed.is_group_by_all && + is_order_by_all == rhs_typed.is_order_by_all && cte_name == rhs_typed.cte_name && projection_columns == rhs_typed.projection_columns && settings_changes == rhs_typed.settings_changes; @@ -288,6 +292,7 @@ void QueryNode::updateTreeHashImpl(HashState & state) const state.update(is_group_by_with_cube); state.update(is_group_by_with_grouping_sets); state.update(is_group_by_all); + state.update(is_order_by_all); state.update(settings_changes.size()); @@ -306,18 +311,19 @@ QueryTreeNodePtr QueryNode::cloneImpl() const { auto result_query_node = std::make_shared(context); - result_query_node->is_subquery = is_subquery; - result_query_node->is_cte = is_cte; - result_query_node->is_distinct = is_distinct; - result_query_node->is_limit_with_ties = is_limit_with_ties; - result_query_node->is_group_by_with_totals = is_group_by_with_totals; - result_query_node->is_group_by_with_rollup = is_group_by_with_rollup; - result_query_node->is_group_by_with_cube = is_group_by_with_cube; + result_query_node->is_subquery = is_subquery; + result_query_node->is_cte = is_cte; + result_query_node->is_distinct = is_distinct; + result_query_node->is_limit_with_ties = is_limit_with_ties; + result_query_node->is_group_by_with_totals = is_group_by_with_totals; + result_query_node->is_group_by_with_rollup = is_group_by_with_rollup; + 
result_query_node->is_group_by_with_cube = is_group_by_with_cube; result_query_node->is_group_by_with_grouping_sets = is_group_by_with_grouping_sets; - result_query_node->is_group_by_all = is_group_by_all; - result_query_node->cte_name = cte_name; - result_query_node->projection_columns = projection_columns; - result_query_node->settings_changes = settings_changes; + result_query_node->is_group_by_all = is_group_by_all; + result_query_node->is_order_by_all = is_order_by_all; + result_query_node->cte_name = cte_name; + result_query_node->projection_columns = projection_columns; + result_query_node->settings_changes = settings_changes; return result_query_node; } From 8e0aea301ee4b416d6bb4bcfdf664756ebff55ec Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Tue, 23 Jan 2024 14:29:26 +0000 Subject: [PATCH 0214/1081] Analyzer: Add cast for ConstantNode from constant folding --- src/Analyzer/ConstantNode.cpp | 5 ++++- tests/analyzer_tech_debt.txt | 1 - 2 files changed, 4 insertions(+), 2 deletions(-) diff --git a/src/Analyzer/ConstantNode.cpp b/src/Analyzer/ConstantNode.cpp index cb05e6ed4e3..69bed3dbe90 100644 --- a/src/Analyzer/ConstantNode.cpp +++ b/src/Analyzer/ConstantNode.cpp @@ -128,7 +128,10 @@ ASTPtr ConstantNode::toASTImpl(const ConvertToASTOptions & options) const } } - if (need_to_add_cast_function) + // Add cast if constant was created as a result of constant folding. + // Constant folding may lead to type transformation and literal on shard + // may have a different type. + if (need_to_add_cast_function || source_expression != nullptr) { auto constant_type_name_ast = std::make_shared(constant_value->getType()->getName()); return makeASTFunction("_CAST", std::move(constant_value_ast), std::move(constant_type_name_ast)); diff --git a/tests/analyzer_tech_debt.txt b/tests/analyzer_tech_debt.txt index 4643d109c3d..dd747fff7df 100644 --- a/tests/analyzer_tech_debt.txt +++ b/tests/analyzer_tech_debt.txt @@ -6,7 +6,6 @@ 01155_rename_move_materialized_view 01214_test_storage_merge_aliases_with_where 01244_optimize_distributed_group_by_sharding_key -01268_shard_avgweighted 01495_subqueries_in_with_statement 01560_merge_distributed_join 01584_distributed_buffer_cannot_find_column From 799a94081ba7587ec47d85554bdbb458ffb1436d Mon Sep 17 00:00:00 2001 From: Arthur Passos Date: Tue, 23 Jan 2024 11:40:42 -0300 Subject: [PATCH 0215/1081] Revert "Revert "Allow to attach partition from table with different partition expression when destination partition expression doesn't re-partition"" This reverts commit a1c83e2f51117a69d484c7ae7884c3bc5dd98129. 
--- .../statements/alter/partition.md | 2 +- src/Interpreters/MonotonicityCheckVisitor.h | 102 +++- src/Interpreters/applyFunction.cpp | 43 ++ src/Interpreters/applyFunction.h | 16 + src/Parsers/queryToString.cpp | 5 + src/Parsers/queryToString.h | 1 + src/Storages/MergeTree/IMergeTreeDataPart.cpp | 37 +- src/Storages/MergeTree/IMergeTreeDataPart.h | 1 + src/Storages/MergeTree/KeyCondition.cpp | 83 +-- src/Storages/MergeTree/MergeTreeData.cpp | 350 +++++-------- src/Storages/MergeTree/MergeTreeData.h | 18 + .../MergeTree/MergeTreeDataPartCloner.cpp | 320 ++++++++++++ .../MergeTree/MergeTreeDataPartCloner.h | 43 ++ src/Storages/MergeTree/MergeTreePartition.cpp | 39 ++ src/Storages/MergeTree/MergeTreePartition.h | 10 +- ...ergeTreePartitionCompatibilityVerifier.cpp | 91 ++++ .../MergeTreePartitionCompatibilityVerifier.h | 30 ++ ...TreePartitionGlobalMinMaxIdxCalculator.cpp | 25 + ...geTreePartitionGlobalMinMaxIdxCalculator.h | 24 + src/Storages/StorageMergeTree.cpp | 93 +++- src/Storages/StorageReplicatedMergeTree.cpp | 135 ++++- .../__init__.py | 0 .../configs/remote_servers.xml | 17 + .../test.py | 214 ++++++++ ...artition_different_partition_exp.reference | 467 +++++++++++++++++ ...tach_partition_different_partition_exp.sql | 485 ++++++++++++++++++ 26 files changed, 2310 insertions(+), 341 deletions(-) create mode 100644 src/Interpreters/applyFunction.cpp create mode 100644 src/Interpreters/applyFunction.h create mode 100644 src/Storages/MergeTree/MergeTreeDataPartCloner.cpp create mode 100644 src/Storages/MergeTree/MergeTreeDataPartCloner.h create mode 100644 src/Storages/MergeTree/MergeTreePartitionCompatibilityVerifier.cpp create mode 100644 src/Storages/MergeTree/MergeTreePartitionCompatibilityVerifier.h create mode 100644 src/Storages/MergeTree/MergeTreePartitionGlobalMinMaxIdxCalculator.cpp create mode 100644 src/Storages/MergeTree/MergeTreePartitionGlobalMinMaxIdxCalculator.h create mode 100644 tests/integration/test_attach_partition_distinct_expression_replicated/__init__.py create mode 100644 tests/integration/test_attach_partition_distinct_expression_replicated/configs/remote_servers.xml create mode 100644 tests/integration/test_attach_partition_distinct_expression_replicated/test.py create mode 100644 tests/queries/0_stateless/02456_test_attach_partition_different_partition_exp.reference create mode 100644 tests/queries/0_stateless/02456_test_attach_partition_different_partition_exp.sql diff --git a/docs/en/sql-reference/statements/alter/partition.md b/docs/en/sql-reference/statements/alter/partition.md index 114b8d5ffe3..5659a0565c5 100644 --- a/docs/en/sql-reference/statements/alter/partition.md +++ b/docs/en/sql-reference/statements/alter/partition.md @@ -112,7 +112,7 @@ Note that: For the query to run successfully, the following conditions must be met: - Both tables must have the same structure. -- Both tables must have the same partition key, the same order by key and the same primary key. +- Both tables must have the same order by key and the same primary key. - Both tables must have the same indices and projections. - Both tables must have the same storage policy. 
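To make the relaxed requirement concrete, here is a hedged sketch of the kind of statement this change enables (table names and the day-to-month layout are illustrative, loosely modeled on the new test 02456_test_attach_partition_different_partition_exp.sql, whose contents are not reproduced here): the destination partition expression is coarser than the source one, so each source partition maps into exactly one destination partition and no re-partitioning is needed.

```sql
DROP TABLE IF EXISTS source;
DROP TABLE IF EXISTS destination;

-- Source partitions by day, destination by month: a daily partition always
-- lands in exactly one monthly partition, so the attach does not re-partition.
CREATE TABLE source (timestamp DateTime)
ENGINE = MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp);

CREATE TABLE destination (timestamp DateTime)
ENGINE = MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp);

INSERT INTO source VALUES ('2010-03-02 02:01:01');

-- Previously rejected because the partition expressions differ; now accepted.
ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source;

SELECT count() FROM destination;  -- expected: 1

DROP TABLE source;
DROP TABLE destination;
```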
diff --git a/src/Interpreters/MonotonicityCheckVisitor.h b/src/Interpreters/MonotonicityCheckVisitor.h index cc386825024..4e71bd56851 100644 --- a/src/Interpreters/MonotonicityCheckVisitor.h +++ b/src/Interpreters/MonotonicityCheckVisitor.h @@ -1,13 +1,17 @@ #pragma once #include +#include #include +#include #include #include -#include #include +#include +#include #include #include +#include #include #include #include @@ -33,6 +37,8 @@ public: ASTIdentifier * identifier = nullptr; DataTypePtr arg_data_type = {}; + Range range = Range::createWholeUniverse(); + void reject() { monotonicity.is_monotonic = false; } bool isRejected() const { return !monotonicity.is_monotonic; } @@ -97,13 +103,30 @@ public: if (data.isRejected()) return; - /// TODO: monotonicity for functions of several arguments - if (!ast_function.arguments || ast_function.arguments->children.size() != 1) + /// Monotonicity check only works for functions that contain at most two arguments and one of them must be a constant. + if (!ast_function.arguments) { data.reject(); return; } + auto arguments_size = ast_function.arguments->children.size(); + + if (arguments_size == 0 || arguments_size > 2) + { + data.reject(); + return; + } + else if (arguments_size == 2) + { + /// If the function has two arguments, then one of them must be a constant. + if (!ast_function.arguments->children[0]->as() && !ast_function.arguments->children[1]->as()) + { + data.reject(); + return; + } + } + if (!data.canOptimize(ast_function)) { data.reject(); @@ -124,14 +147,33 @@ public: return; } - ColumnsWithTypeAndName args; - args.emplace_back(data.arg_data_type, "tmp"); - auto function_base = function->build(args); + auto function_arguments = getFunctionArguments(ast_function, data); + + auto function_base = function->build(function_arguments); if (function_base && function_base->hasInformationAboutMonotonicity()) { bool is_positive = data.monotonicity.is_positive; - data.monotonicity = function_base->getMonotonicityForRange(*data.arg_data_type, Field(), Field()); + data.monotonicity = function_base->getMonotonicityForRange(*data.arg_data_type, data.range.left, data.range.right); + + auto & key_range = data.range; + + /// If we apply function to open interval, we can get empty intervals in result. + /// E.g. for ('2020-01-03', '2020-01-20') after applying 'toYYYYMM' we will get ('202001', '202001'). + /// To avoid this we make range left and right included. + /// Any function that treats NULL specially is not monotonic. + /// Thus we can safely use isNull() as an -Inf/+Inf indicator here. + if (!key_range.left.isNull()) + { + key_range.left = applyFunction(function_base, data.arg_data_type, key_range.left); + key_range.left_included = true; + } + + if (!key_range.right.isNull()) + { + key_range.right = applyFunction(function_base, data.arg_data_type, key_range.right); + key_range.right_included = true; + } if (!is_positive) data.monotonicity.is_positive = !data.monotonicity.is_positive; @@ -143,13 +185,53 @@ public: static bool needChildVisit(const ASTPtr & parent, const ASTPtr &) { - /// Currently we check monotonicity only for single-argument functions. - /// Although, multi-argument functions with all but one constant arguments can also be monotonic. + /// Multi-argument functions with all but one constant arguments can be monotonic. 
if (const auto * func = typeid_cast(parent.get())) - return func->arguments->children.size() < 2; + return func->arguments->children.size() <= 2; return true; } + + static ColumnWithTypeAndName extractLiteralColumnAndTypeFromAstLiteral(const ASTLiteral * literal) + { + ColumnWithTypeAndName result; + + result.type = applyVisitor(FieldToDataType(), literal->value); + result.column = result.type->createColumnConst(0, literal->value); + + return result; + } + + static ColumnsWithTypeAndName getFunctionArguments(const ASTFunction & ast_function, const Data & data) + { + ColumnsWithTypeAndName args; + + auto arguments_size = ast_function.arguments->children.size(); + + chassert(arguments_size == 1 || arguments_size == 2); + + if (arguments_size == 2) + { + if (ast_function.arguments->children[0]->as()) + { + const auto * literal = ast_function.arguments->children[0]->as(); + args.push_back(extractLiteralColumnAndTypeFromAstLiteral(literal)); + args.emplace_back(data.arg_data_type, "tmp"); + } + else + { + const auto * literal = ast_function.arguments->children[1]->as(); + args.emplace_back(data.arg_data_type, "tmp"); + args.push_back(extractLiteralColumnAndTypeFromAstLiteral(literal)); + } + } + else + { + args.emplace_back(data.arg_data_type, "tmp"); + } + + return args; + } }; using MonotonicityCheckVisitor = ConstInDepthNodeVisitor; diff --git a/src/Interpreters/applyFunction.cpp b/src/Interpreters/applyFunction.cpp new file mode 100644 index 00000000000..a53f14f0381 --- /dev/null +++ b/src/Interpreters/applyFunction.cpp @@ -0,0 +1,43 @@ +#include + +#include +#include + +namespace DB +{ + +static Field applyFunctionForField(const FunctionBasePtr & func, const DataTypePtr & arg_type, const Field & arg_value) +{ + ColumnsWithTypeAndName columns{ + {arg_type->createColumnConst(1, arg_value), arg_type, "x"}, + }; + + auto col = func->execute(columns, func->getResultType(), 1); + return (*col)[0]; +} + +FieldRef applyFunction(const FunctionBasePtr & func, const DataTypePtr & current_type, const FieldRef & field) +{ + /// Fallback for fields without block reference. 
+ if (field.isExplicit()) + return applyFunctionForField(func, current_type, field); + + String result_name = "_" + func->getName() + "_" + toString(field.column_idx); + const auto & columns = field.columns; + size_t result_idx = columns->size(); + + for (size_t i = 0; i < result_idx; ++i) + if ((*columns)[i].name == result_name) + result_idx = i; + + if (result_idx == columns->size()) + { + ColumnsWithTypeAndName args{(*columns)[field.column_idx]}; + field.columns->emplace_back(ColumnWithTypeAndName{nullptr, func->getResultType(), result_name}); + (*columns)[result_idx].column = func->execute(args, (*columns)[result_idx].type, columns->front().column->size()); + } + + return {field.columns, field.row_idx, result_idx}; +} + +} diff --git a/src/Interpreters/applyFunction.h b/src/Interpreters/applyFunction.h new file mode 100644 index 00000000000..9b8ae43a53c --- /dev/null +++ b/src/Interpreters/applyFunction.h @@ -0,0 +1,16 @@ +#pragma once + +#include + +namespace DB +{ +struct FieldRef; + +class IFunctionBase; +class IDataType; + +using DataTypePtr = std::shared_ptr; +using FunctionBasePtr = std::shared_ptr; + +FieldRef applyFunction(const FunctionBasePtr & func, const DataTypePtr & current_type, const FieldRef & field); +} diff --git a/src/Parsers/queryToString.cpp b/src/Parsers/queryToString.cpp index 9721aa1f128..4a1903393f6 100644 --- a/src/Parsers/queryToString.cpp +++ b/src/Parsers/queryToString.cpp @@ -3,6 +3,11 @@ namespace DB { + String queryToStringNullable(const ASTPtr & query) + { + return query ? queryToString(query) : ""; + } + String queryToString(const ASTPtr & query) { return queryToString(*query); diff --git a/src/Parsers/queryToString.h b/src/Parsers/queryToString.h index 873de218293..3acd560b1e2 100644 --- a/src/Parsers/queryToString.h +++ b/src/Parsers/queryToString.h @@ -6,4 +6,5 @@ namespace DB { String queryToString(const ASTPtr & query); String queryToString(const IAST & query); + String queryToStringNullable(const ASTPtr & query); } diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index 87f23b0da2a..f3057a8254f 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -81,6 +81,7 @@ void IMergeTreeDataPart::MinMaxIndex::load(const MergeTreeData & data, const Par auto minmax_column_types = data.getMinMaxColumnsTypes(partition_key); size_t minmax_idx_size = minmax_column_types.size(); + hyperrectangle.clear(); hyperrectangle.reserve(minmax_idx_size); for (size_t i = 0; i < minmax_idx_size; ++i) { @@ -104,6 +105,39 @@ void IMergeTreeDataPart::MinMaxIndex::load(const MergeTreeData & data, const Par initialized = true; } +Block IMergeTreeDataPart::MinMaxIndex::getBlock(const MergeTreeData & data) const +{ + if (!initialized) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Attempt to get block from uninitialized MinMax index."); + + Block block; + + const auto metadata_snapshot = data.getInMemoryMetadataPtr(); + const auto & partition_key = metadata_snapshot->getPartitionKey(); + + const auto minmax_column_names = data.getMinMaxColumnsNames(partition_key); + const auto minmax_column_types = data.getMinMaxColumnsTypes(partition_key); + const auto minmax_idx_size = minmax_column_types.size(); + + for (size_t i = 0; i < minmax_idx_size; ++i) + { + const auto & data_type = minmax_column_types[i]; + const auto & column_name = minmax_column_names[i]; + + const auto column = data_type->createColumn(); + + const auto min_val = hyperrectangle.at(i).left; + const auto 
max_val = hyperrectangle.at(i).right; + + column->insert(min_val); + column->insert(max_val); + + block.insert(ColumnWithTypeAndName(column->getPtr(), data_type, column_name)); + } + + return block; +} + IMergeTreeDataPart::MinMaxIndex::WrittenFiles IMergeTreeDataPart::MinMaxIndex::store( const MergeTreeData & data, IDataPartStorage & part_storage, Checksums & out_checksums) const { @@ -185,8 +219,7 @@ void IMergeTreeDataPart::MinMaxIndex::merge(const MinMaxIndex & other) if (!initialized) { - hyperrectangle = other.hyperrectangle; - initialized = true; + *this = other; } else { diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.h b/src/Storages/MergeTree/IMergeTreeDataPart.h index 640a1f1d0a3..29f0f54d419 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.h +++ b/src/Storages/MergeTree/IMergeTreeDataPart.h @@ -336,6 +336,7 @@ public: } void load(const MergeTreeData & data, const PartMetadataManagerPtr & manager); + Block getBlock(const MergeTreeData & data) const; using WrittenFiles = std::vector>; diff --git a/src/Storages/MergeTree/KeyCondition.cpp b/src/Storages/MergeTree/KeyCondition.cpp index d5922ae1bc2..e5bcb11091f 100644 --- a/src/Storages/MergeTree/KeyCondition.cpp +++ b/src/Storages/MergeTree/KeyCondition.cpp @@ -1,36 +1,37 @@ -#include -#include -#include +#include +#include #include #include #include #include +#include #include -#include #include -#include -#include -#include -#include -#include -#include -#include +#include #include +#include #include -#include -#include -#include -#include -#include -#include +#include +#include +#include +#include +#include #include -#include +#include +#include +#include +#include +#include #include #include #include -#include -#include +#include +#include +#include #include +#include +#include +#include #include #include @@ -836,21 +837,6 @@ bool KeyCondition::getConstant(const ASTPtr & expr, Block & block_with_constants return node.tryGetConstant(out_value, out_type); } - -static Field applyFunctionForField( - const FunctionBasePtr & func, - const DataTypePtr & arg_type, - const Field & arg_value) -{ - ColumnsWithTypeAndName columns - { - { arg_type->createColumnConst(1, arg_value), arg_type, "x" }, - }; - - auto col = func->execute(columns, func->getResultType(), 1); - return (*col)[0]; -} - /// The case when arguments may have types different than in the primary key. static std::pair applyFunctionForFieldOfUnknownType( const FunctionBasePtr & func, @@ -890,33 +876,6 @@ static std::pair applyBinaryFunctionForFieldOfUnknownType( return {std::move(result), std::move(return_type)}; } - -static FieldRef applyFunction(const FunctionBasePtr & func, const DataTypePtr & current_type, const FieldRef & field) -{ - /// Fallback for fields without block reference. 
- if (field.isExplicit()) - return applyFunctionForField(func, current_type, field); - - String result_name = "_" + func->getName() + "_" + toString(field.column_idx); - const auto & columns = field.columns; - size_t result_idx = columns->size(); - - for (size_t i = 0; i < result_idx; ++i) - { - if ((*columns)[i].name == result_name) - result_idx = i; - } - - if (result_idx == columns->size()) - { - ColumnsWithTypeAndName args{(*columns)[field.column_idx]}; - field.columns->emplace_back(ColumnWithTypeAndName {nullptr, func->getResultType(), result_name}); - (*columns)[result_idx].column = func->execute(args, (*columns)[result_idx].type, columns->front().column->size()); - } - - return {field.columns, field.row_idx, result_idx}; -} - /** When table's key has expression with these functions from a column, * and when a column in a query is compared with a constant, such as: * CREATE TABLE (x String) ORDER BY toDate(x) diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index 61332a4ff38..c3e348a549a 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -8,21 +8,6 @@ #include #include #include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include #include #include #include @@ -43,19 +28,20 @@ #include #include #include -#include -#include #include #include #include #include #include #include +#include +#include #include +#include #include -#include -#include #include +#include +#include #include #include #include @@ -64,26 +50,41 @@ #include #include #include -#include #include #include #include #include #include #include +#include #include #include +#include #include #include #include #include #include +#include #include #include -#include #include #include #include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include #include #include @@ -197,6 +198,50 @@ namespace ErrorCodes extern const int LIMIT_EXCEEDED; } +static size_t getPartitionAstFieldsCount(const ASTPartition & partition_ast, ASTPtr partition_value_ast) +{ + if (partition_ast.fields_count.has_value()) + return *partition_ast.fields_count; + + if (partition_value_ast->as()) + return 1; + + const auto * tuple_ast = partition_value_ast->as(); + + if (!tuple_ast) + { + throw Exception( + ErrorCodes::INVALID_PARTITION_VALUE, "Expected literal or tuple for partition key, got {}", partition_value_ast->getID()); + } + + if (tuple_ast->name != "tuple") + { + if (!isFunctionCast(tuple_ast)) + throw Exception(ErrorCodes::INVALID_PARTITION_VALUE, "Expected tuple for complex partition key, got {}", tuple_ast->name); + + if (tuple_ast->arguments->as()->children.empty()) + throw Exception(ErrorCodes::INVALID_PARTITION_VALUE, "Expected tuple for complex partition key, got {}", tuple_ast->name); + + auto first_arg = tuple_ast->arguments->as()->children.at(0); + if (const auto * inner_tuple = first_arg->as(); inner_tuple && inner_tuple->name == "tuple") + { + const auto * arguments_ast = tuple_ast->arguments->as(); + return arguments_ast ? arguments_ast->children.size() : 0; + } + else if (const auto * inner_literal_tuple = first_arg->as(); inner_literal_tuple) + { + return inner_literal_tuple->value.getType() == Field::Types::Tuple ? 
inner_literal_tuple->value.safeGet().size() : 1; + } + + throw Exception(ErrorCodes::INVALID_PARTITION_VALUE, "Expected tuple for complex partition key, got {}", tuple_ast->name); + } + else + { + const auto * arguments_ast = tuple_ast->arguments->as(); + return arguments_ast ? arguments_ast->children.size() : 0; + } +} + static void checkSuspiciousIndices(const ASTFunction * index_function) { std::unordered_set unique_index_expression_hashes; @@ -4854,7 +4899,7 @@ void MergeTreeData::removePartContributionToColumnAndSecondaryIndexSizes(const D } void MergeTreeData::checkAlterPartitionIsPossible( - const PartitionCommands & commands, const StorageMetadataPtr & /*metadata_snapshot*/, const Settings & settings, ContextPtr local_context) const + const PartitionCommands & commands, const StorageMetadataPtr & /*metadata_snapshot*/, const Settings & settings, ContextPtr) const { for (const auto & command : commands) { @@ -4882,7 +4927,15 @@ void MergeTreeData::checkAlterPartitionIsPossible( throw DB::Exception(ErrorCodes::SUPPORT_IS_DISABLED, "Only support DROP/DETACH PARTITION ALL currently"); } else - getPartitionIDFromQuery(command.partition, local_context); + { + // The below `getPartitionIDFromQuery` call will not work for attach / replace because it assumes the partition expressions + // are the same and deliberately uses this storage. Later on, `MergeTreeData::replaceFrom` is called, and it makes the right + // call to `getPartitionIDFromQuery` using source storage. + // Note: `PartitionCommand::REPLACE_PARTITION` is used both for `REPLACE PARTITION` and `ATTACH PARTITION FROM` queries. + // But not for `ATTACH PARTITION` queries. + if (command.type != PartitionCommand::REPLACE_PARTITION) + getPartitionIDFromQuery(command.partition, getContext()); + } } } } @@ -5616,69 +5669,8 @@ String MergeTreeData::getPartitionIDFromQuery(const ASTPtr & ast, ContextPtr loc MergeTreePartInfo::validatePartitionID(partition_ast.id->clone(), format_version); return partition_ast.id->as()->value.safeGet(); } - size_t partition_ast_fields_count = 0; ASTPtr partition_value_ast = partition_ast.value->clone(); - if (!partition_ast.fields_count.has_value()) - { - if (partition_value_ast->as()) - { - partition_ast_fields_count = 1; - } - else if (const auto * tuple_ast = partition_value_ast->as()) - { - if (tuple_ast->name != "tuple") - { - if (isFunctionCast(tuple_ast)) - { - if (tuple_ast->arguments->as()->children.empty()) - { - throw Exception( - ErrorCodes::INVALID_PARTITION_VALUE, "Expected tuple for complex partition key, got {}", tuple_ast->name); - } - auto first_arg = tuple_ast->arguments->as()->children.at(0); - if (const auto * inner_tuple = first_arg->as(); inner_tuple && inner_tuple->name == "tuple") - { - const auto * arguments_ast = tuple_ast->arguments->as(); - if (arguments_ast) - partition_ast_fields_count = arguments_ast->children.size(); - else - partition_ast_fields_count = 0; - } - else if (const auto * inner_literal_tuple = first_arg->as(); inner_literal_tuple) - { - if (inner_literal_tuple->value.getType() == Field::Types::Tuple) - partition_ast_fields_count = inner_literal_tuple->value.safeGet().size(); - else - partition_ast_fields_count = 1; - } - else - { - throw Exception( - ErrorCodes::INVALID_PARTITION_VALUE, "Expected tuple for complex partition key, got {}", tuple_ast->name); - } - } - else - throw Exception(ErrorCodes::INVALID_PARTITION_VALUE, "Expected tuple for complex partition key, got {}", tuple_ast->name); - } - else - { - const auto * arguments_ast = 
tuple_ast->arguments->as(); - if (arguments_ast) - partition_ast_fields_count = arguments_ast->children.size(); - else - partition_ast_fields_count = 0; - } - } - else - { - throw Exception( - ErrorCodes::INVALID_PARTITION_VALUE, "Expected literal or tuple for partition key, got {}", partition_value_ast->getID()); - } - } - else - { - partition_ast_fields_count = *partition_ast.fields_count; - } + auto partition_ast_fields_count = getPartitionAstFieldsCount(partition_ast, partition_value_ast); if (format_version < MERGE_TREE_DATA_MIN_FORMAT_VERSION_WITH_CUSTOM_PARTITIONING) { @@ -7014,23 +7006,35 @@ MergeTreeData & MergeTreeData::checkStructureAndGetMergeTreeData(IStorage & sour if (my_snapshot->getColumns().getAllPhysical().sizeOfDifference(src_snapshot->getColumns().getAllPhysical())) throw Exception(ErrorCodes::INCOMPATIBLE_COLUMNS, "Tables have different structure"); - auto query_to_string = [] (const ASTPtr & ast) - { - return ast ? queryToString(ast) : ""; - }; - - if (query_to_string(my_snapshot->getSortingKeyAST()) != query_to_string(src_snapshot->getSortingKeyAST())) + if (queryToStringNullable(my_snapshot->getSortingKeyAST()) != queryToStringNullable(src_snapshot->getSortingKeyAST())) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Tables have different ordering"); - if (query_to_string(my_snapshot->getPartitionKeyAST()) != query_to_string(src_snapshot->getPartitionKeyAST())) - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Tables have different partition key"); - if (format_version != src_data->format_version) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Tables have different format_version"); - if (query_to_string(my_snapshot->getPrimaryKeyAST()) != query_to_string(src_snapshot->getPrimaryKeyAST())) + if (queryToStringNullable(my_snapshot->getPrimaryKeyAST()) != queryToStringNullable(src_snapshot->getPrimaryKeyAST())) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Tables have different primary key"); + const auto is_a_subset_of = [](const auto & lhs, const auto & rhs) + { + if (lhs.size() > rhs.size()) + return false; + + const auto rhs_set = NameSet(rhs.begin(), rhs.end()); + for (const auto & lhs_element : lhs) + if (!rhs_set.contains(lhs_element)) + return false; + + return true; + }; + + if (!is_a_subset_of(my_snapshot->getColumnsRequiredForPartitionKey(), src_snapshot->getColumnsRequiredForPartitionKey())) + { + throw Exception( + ErrorCodes::BAD_ARGUMENTS, + "Destination table partition expression columns must be a subset of source table partition expression columns"); + } + const auto check_definitions = [](const auto & my_descriptions, const auto & src_descriptions) { if (my_descriptions.size() != src_descriptions.size()) @@ -7071,128 +7075,56 @@ std::pair MergeTreeData::cloneAn const ReadSettings & read_settings, const WriteSettings & write_settings) { - /// Check that the storage policy contains the disk where the src_part is located. 
- bool does_storage_policy_allow_same_disk = false; - for (const DiskPtr & disk : getStoragePolicy()->getDisks()) - { - if (disk->getName() == src_part->getDataPartStorage().getDiskName()) - { - does_storage_policy_allow_same_disk = true; - break; - } - } - if (!does_storage_policy_allow_same_disk) - throw Exception( - ErrorCodes::BAD_ARGUMENTS, - "Could not clone and load part {} because disk does not belong to storage policy", - quoteString(src_part->getDataPartStorage().getFullPath())); + return MergeTreeDataPartCloner::clone( + this, src_part, metadata_snapshot, dst_part_info, tmp_part_prefix, require_part_metadata, params, read_settings, write_settings); +} - String dst_part_name = src_part->getNewName(dst_part_info); - String tmp_dst_part_name = tmp_part_prefix + dst_part_name; - auto temporary_directory_lock = getTemporaryPartDirectoryHolder(tmp_dst_part_name); +std::pair MergeTreeData::cloneAndLoadPartOnSameDiskWithDifferentPartitionKey( + const MergeTreeData::DataPartPtr & src_part, + const MergeTreePartition & new_partition, + const String & partition_id, + const IMergeTreeDataPart::MinMaxIndex & min_max_index, + const String & tmp_part_prefix, + const StorageMetadataPtr & my_metadata_snapshot, + const IDataPartStorage::ClonePartParams & clone_params, + ContextPtr local_context, + Int64 min_block, + Int64 max_block +) +{ + MergeTreePartInfo dst_part_info(partition_id, min_block, max_block, src_part->info.level); - /// Why it is needed if we only hardlink files? - auto reservation = src_part->getDataPartStorage().reserve(src_part->getBytesOnDisk()); - auto src_part_storage = src_part->getDataPartStoragePtr(); + return MergeTreeDataPartCloner::cloneWithDistinctPartitionExpression( + this, + src_part, + my_metadata_snapshot, + dst_part_info, + tmp_part_prefix, + local_context->getReadSettings(), + local_context->getWriteSettings(), + new_partition, + min_max_index, + false, + clone_params); +} - scope_guard src_flushed_tmp_dir_lock; - MergeTreeData::MutableDataPartPtr src_flushed_tmp_part; +std::pair MergeTreeData::createPartitionAndMinMaxIndexFromSourcePart( + const MergeTreeData::DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + ContextPtr local_context) +{ + const auto & src_data = src_part->storage; - /// If source part is in memory, flush it to disk and clone it already in on-disk format - /// Protect tmp dir from removing by cleanup thread with src_flushed_tmp_dir_lock - /// Construct src_flushed_tmp_part in order to delete part with its directory at destructor - if (auto src_part_in_memory = asInMemoryPart(src_part)) - { - auto flushed_part_path = *src_part_in_memory->getRelativePathForPrefix(tmp_part_prefix); + auto metadata_manager = std::make_shared(src_part.get()); + IMergeTreeDataPart::MinMaxIndex min_max_index; - auto tmp_src_part_file_name = fs::path(tmp_dst_part_name).filename(); - src_flushed_tmp_dir_lock = src_part->storage.getTemporaryPartDirectoryHolder(tmp_src_part_file_name); + min_max_index.load(src_data, metadata_manager); - auto flushed_part_storage = src_part_in_memory->flushToDisk(flushed_part_path, metadata_snapshot); + MergeTreePartition new_partition; - src_flushed_tmp_part = MergeTreeDataPartBuilder(*this, src_part->name, flushed_part_storage) - .withPartInfo(src_part->info) - .withPartFormatFromDisk() - .build(); + new_partition.create(metadata_snapshot, min_max_index.getBlock(src_data), 0u, local_context); - src_flushed_tmp_part->is_temp = true; - src_part_storage = flushed_part_storage; - } - - String with_copy; - if 
(params.copy_instead_of_hardlink) - with_copy = " (copying data)"; - - auto dst_part_storage = src_part_storage->freeze( - relative_data_path, - tmp_dst_part_name, - read_settings, - write_settings, - /* save_metadata_callback= */ {}, - params); - - if (params.metadata_version_to_write.has_value()) - { - chassert(!params.keep_metadata_version); - auto out_metadata = dst_part_storage->writeFile(IMergeTreeDataPart::METADATA_VERSION_FILE_NAME, 4096, getContext()->getWriteSettings()); - writeText(metadata_snapshot->getMetadataVersion(), *out_metadata); - out_metadata->finalize(); - if (getSettings()->fsync_after_insert) - out_metadata->sync(); - } - - LOG_DEBUG(log, "Clone{} part {} to {}{}", - src_flushed_tmp_part ? " flushed" : "", - src_part_storage->getFullPath(), - std::string(fs::path(dst_part_storage->getFullRootPath()) / tmp_dst_part_name), - with_copy); - - auto dst_data_part = MergeTreeDataPartBuilder(*this, dst_part_name, dst_part_storage) - .withPartFormatFromDisk() - .build(); - - if (!params.copy_instead_of_hardlink && params.hardlinked_files) - { - params.hardlinked_files->source_part_name = src_part->name; - params.hardlinked_files->source_table_shared_id = src_part->storage.getTableSharedID(); - - for (auto it = src_part->getDataPartStorage().iterate(); it->isValid(); it->next()) - { - if (!params.files_to_copy_instead_of_hardlinks.contains(it->name()) - && it->name() != IMergeTreeDataPart::DELETE_ON_DESTROY_MARKER_FILE_NAME_DEPRECATED - && it->name() != IMergeTreeDataPart::TXN_VERSION_METADATA_FILE_NAME) - { - params.hardlinked_files->hardlinks_from_source_part.insert(it->name()); - } - } - - auto projections = src_part->getProjectionParts(); - for (const auto & [name, projection_part] : projections) - { - const auto & projection_storage = projection_part->getDataPartStorage(); - for (auto it = projection_storage.iterate(); it->isValid(); it->next()) - { - auto file_name_with_projection_prefix = fs::path(projection_storage.getPartDirectory()) / it->name(); - if (!params.files_to_copy_instead_of_hardlinks.contains(file_name_with_projection_prefix) - && it->name() != IMergeTreeDataPart::DELETE_ON_DESTROY_MARKER_FILE_NAME_DEPRECATED - && it->name() != IMergeTreeDataPart::TXN_VERSION_METADATA_FILE_NAME) - { - params.hardlinked_files->hardlinks_from_source_part.insert(file_name_with_projection_prefix); - } - } - } - } - - /// We should write version metadata on part creation to distinguish it from parts that were created without transaction. - TransactionID tid = params.txn ? 
params.txn->tid : Tx::PrehistoricTID; - dst_data_part->version.setCreationTID(tid, nullptr); - dst_data_part->storeVersionMetadata(); - - dst_data_part->is_temp = true; - - dst_data_part->loadColumnsChecksumsIndexes(require_part_metadata, true); - dst_data_part->modification_time = dst_part_storage->getLastModified().epochTime(); - return std::make_pair(dst_data_part, std::move(temporary_directory_lock)); + return {new_partition, min_max_index}; } String MergeTreeData::getFullPathOnDisk(const DiskPtr & disk) const diff --git a/src/Storages/MergeTree/MergeTreeData.h b/src/Storages/MergeTree/MergeTreeData.h index f0dbaf0e307..9c433e11b84 100644 --- a/src/Storages/MergeTree/MergeTreeData.h +++ b/src/Storages/MergeTree/MergeTreeData.h @@ -231,6 +231,7 @@ public: } }; + using DataParts = std::set; using MutableDataParts = std::set; using DataPartsVector = std::vector; @@ -848,6 +849,23 @@ public: const ReadSettings & read_settings, const WriteSettings & write_settings); + std::pair cloneAndLoadPartOnSameDiskWithDifferentPartitionKey( + const MergeTreeData::DataPartPtr & src_part, + const MergeTreePartition & new_partition, + const String & partition_id, + const IMergeTreeDataPart::MinMaxIndex & min_max_index, + const String & tmp_part_prefix, + const StorageMetadataPtr & my_metadata_snapshot, + const IDataPartStorage::ClonePartParams & clone_params, + ContextPtr local_context, + Int64 min_block, + Int64 max_block); + + static std::pair createPartitionAndMinMaxIndexFromSourcePart( + const MergeTreeData::DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + ContextPtr local_context); + virtual std::vector getMutationsStatus() const = 0; /// Returns true if table can create new parts with adaptive granularity diff --git a/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp b/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp new file mode 100644 index 00000000000..78cb9aa0624 --- /dev/null +++ b/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp @@ -0,0 +1,320 @@ +#include +#include +#include +#include +#include +#include + +namespace DB +{ + +namespace ErrorCodes +{ +extern const int BAD_ARGUMENTS; +} + +static Poco::Logger * log = &Poco::Logger::get("MergeTreeDataPartCloner"); + +namespace DistinctPartitionExpression +{ +std::unique_ptr updatePartitionFile( + const MergeTreeData & merge_tree_data, + const MergeTreePartition & partition, + const MergeTreeData::MutableDataPartPtr & dst_part, + IDataPartStorage & storage) +{ + storage.removeFile("partition.dat"); + // Leverage already implemented MergeTreePartition::store to create & store partition.dat. + // Checksum is re-calculated later. 
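+    // The `partition` argument received here already holds the value computed under the destination table's partition +    // expression (built in createPartitionAndMinMaxIndexFromSourcePart from the source part's min/max index block), +    // so the re-written partition.dat describes the part under the destination key.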
+ return partition.store(merge_tree_data, storage, dst_part->checksums); +} + +IMergeTreeDataPart::MinMaxIndex::WrittenFiles updateMinMaxFiles( + const MergeTreeData & merge_tree_data, + const MergeTreeData::MutableDataPartPtr & dst_part, + IDataPartStorage & storage, + const StorageMetadataPtr & metadata_snapshot) +{ + for (const auto & column_name : MergeTreeData::getMinMaxColumnsNames(metadata_snapshot->partition_key)) + { + auto file = "minmax_" + escapeForFileName(column_name) + ".idx"; + storage.removeFile(file); + } + + return dst_part->minmax_idx->store(merge_tree_data, storage, dst_part->checksums); +} + +void finalizeNewFiles(const std::vector> & files, bool sync_new_files) +{ + for (const auto & file : files) + { + file->finalize(); + if (sync_new_files) + file->sync(); + } +} + +void updateNewPartFiles( + const MergeTreeData & merge_tree_data, + const MergeTreeData::MutableDataPartPtr & dst_part, + const MergeTreePartition & new_partition, + const IMergeTreeDataPart::MinMaxIndex & new_min_max_index, + const StorageMetadataPtr & src_metadata_snapshot, + bool sync_new_files) +{ + auto & storage = dst_part->getDataPartStorage(); + + *dst_part->minmax_idx = new_min_max_index; + + auto partition_file = updatePartitionFile(merge_tree_data, new_partition, dst_part, storage); + + auto min_max_files = updateMinMaxFiles(merge_tree_data, dst_part, storage, src_metadata_snapshot); + + IMergeTreeDataPart::MinMaxIndex::WrittenFiles written_files; + + if (partition_file) + written_files.emplace_back(std::move(partition_file)); + + written_files.insert(written_files.end(), std::make_move_iterator(min_max_files.begin()), std::make_move_iterator(min_max_files.end())); + + finalizeNewFiles(written_files, sync_new_files); + + // MergeTreeDataPartCloner::finalize_part calls IMergeTreeDataPart::loadColumnsChecksumsIndexes, which will re-create + // the checksum file if it doesn't exist. Relying on that is cumbersome, but this refactoring is simply a code extraction + // with small improvements. It can be further improved in the future. 
+ storage.removeFile("checksums.txt"); +} +} + +namespace +{ +bool doesStoragePolicyAllowSameDisk(MergeTreeData * merge_tree_data, const MergeTreeData::DataPartPtr & src_part) +{ + for (const DiskPtr & disk : merge_tree_data->getStoragePolicy()->getDisks()) + if (disk->getName() == src_part->getDataPartStorage().getDiskName()) + return true; + return false; +} + +DataPartStoragePtr flushPartStorageToDiskIfInMemory( + MergeTreeData * merge_tree_data, + const MergeTreeData::DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + const String & tmp_part_prefix, + const String & tmp_dst_part_name, + scope_guard & src_flushed_tmp_dir_lock, + MergeTreeData::MutableDataPartPtr src_flushed_tmp_part) +{ + if (auto src_part_in_memory = asInMemoryPart(src_part)) + { + auto flushed_part_path = src_part_in_memory->getRelativePathForPrefix(tmp_part_prefix); + auto tmp_src_part_file_name = fs::path(tmp_dst_part_name).filename(); + + src_flushed_tmp_dir_lock = src_part->storage.getTemporaryPartDirectoryHolder(tmp_src_part_file_name); + + auto flushed_part_storage = src_part_in_memory->flushToDisk(*flushed_part_path, metadata_snapshot); + + src_flushed_tmp_part = MergeTreeDataPartBuilder(*merge_tree_data, src_part->name, flushed_part_storage) + .withPartInfo(src_part->info) + .withPartFormatFromDisk() + .build(); + + src_flushed_tmp_part->is_temp = true; + + return flushed_part_storage; + } + + return src_part->getDataPartStoragePtr(); +} + +std::shared_ptr hardlinkAllFiles( + MergeTreeData * merge_tree_data, + const DB::ReadSettings & read_settings, + const DB::WriteSettings & write_settings, + const DataPartStoragePtr & storage, + const String & path, + const DB::IDataPartStorage::ClonePartParams & params) +{ + return storage->freeze( + merge_tree_data->getRelativeDataPath(), + path, + read_settings, + write_settings, + /*save_metadata_callback=*/{}, + params); +} + +std::pair cloneSourcePart( + MergeTreeData * merge_tree_data, + const MergeTreeData::DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + const MergeTreePartInfo & dst_part_info, + const String & tmp_part_prefix, + const ReadSettings & read_settings, + const WriteSettings & write_settings, + const DB::IDataPartStorage::ClonePartParams & params) +{ + const auto dst_part_name = src_part->getNewName(dst_part_info); + + const auto tmp_dst_part_name = tmp_part_prefix + dst_part_name; + + auto temporary_directory_lock = merge_tree_data->getTemporaryPartDirectoryHolder(tmp_dst_part_name); + + src_part->getDataPartStorage().reserve(src_part->getBytesOnDisk()); + + scope_guard src_flushed_tmp_dir_lock; + MergeTreeData::MutableDataPartPtr src_flushed_tmp_part; + + auto src_part_storage = flushPartStorageToDiskIfInMemory( + merge_tree_data, src_part, metadata_snapshot, tmp_part_prefix, tmp_dst_part_name, src_flushed_tmp_dir_lock, src_flushed_tmp_part); + + auto dst_part_storage = hardlinkAllFiles(merge_tree_data, read_settings, write_settings, src_part_storage, tmp_dst_part_name, params); + + if (params.metadata_version_to_write.has_value()) + { + chassert(!params.keep_metadata_version); + auto out_metadata = dst_part_storage->writeFile( + IMergeTreeDataPart::METADATA_VERSION_FILE_NAME, 4096, merge_tree_data->getContext()->getWriteSettings()); + writeText(metadata_snapshot->getMetadataVersion(), *out_metadata); + out_metadata->finalize(); + if (merge_tree_data->getSettings()->fsync_after_insert) + out_metadata->sync(); + } + + LOG_DEBUG( + log, + "Clone {} part {} to {}{}", + src_flushed_tmp_part ? 
"flushed" : "", + src_part_storage->getFullPath(), + std::string(fs::path(dst_part_storage->getFullRootPath()) / tmp_dst_part_name), + false); + + + auto part = MergeTreeDataPartBuilder(*merge_tree_data, dst_part_name, dst_part_storage).withPartFormatFromDisk().build(); + + return std::make_pair(part, std::move(temporary_directory_lock)); +} + +void handleHardLinkedParameterFiles(const MergeTreeData::DataPartPtr & src_part, const DB::IDataPartStorage::ClonePartParams & params) +{ + const auto & hardlinked_files = params.hardlinked_files; + + hardlinked_files->source_part_name = src_part->name; + hardlinked_files->source_table_shared_id = src_part->storage.getTableSharedID(); + + for (auto it = src_part->getDataPartStorage().iterate(); it->isValid(); it->next()) + { + if (!params.files_to_copy_instead_of_hardlinks.contains(it->name()) + && it->name() != IMergeTreeDataPart::DELETE_ON_DESTROY_MARKER_FILE_NAME_DEPRECATED + && it->name() != IMergeTreeDataPart::TXN_VERSION_METADATA_FILE_NAME) + { + hardlinked_files->hardlinks_from_source_part.insert(it->name()); + } + } +} + +void handleProjections(const MergeTreeData::DataPartPtr & src_part, const DB::IDataPartStorage::ClonePartParams & params) +{ + auto projections = src_part->getProjectionParts(); + for (const auto & [name, projection_part] : projections) + { + const auto & projection_storage = projection_part->getDataPartStorage(); + for (auto it = projection_storage.iterate(); it->isValid(); it->next()) + { + auto file_name_with_projection_prefix = fs::path(projection_storage.getPartDirectory()) / it->name(); + if (!params.files_to_copy_instead_of_hardlinks.contains(file_name_with_projection_prefix) + && it->name() != IMergeTreeDataPart::DELETE_ON_DESTROY_MARKER_FILE_NAME_DEPRECATED + && it->name() != IMergeTreeDataPart::TXN_VERSION_METADATA_FILE_NAME) + { + params.hardlinked_files->hardlinks_from_source_part.insert(file_name_with_projection_prefix); + } + } + } +} + +MergeTreeData::MutableDataPartPtr finalizePart( + const MergeTreeData::MutableDataPartPtr & dst_part, const DB::IDataPartStorage::ClonePartParams & params, bool require_part_metadata) +{ + /// We should write version metadata on part creation to distinguish it from parts that were created without transaction. + TransactionID tid = params.txn ? 
params.txn->tid : Tx::PrehistoricTID; + dst_part->version.setCreationTID(tid, nullptr); + dst_part->storeVersionMetadata(); + + dst_part->is_temp = true; + + dst_part->loadColumnsChecksumsIndexes(require_part_metadata, true); + + dst_part->modification_time = dst_part->getDataPartStorage().getLastModified().epochTime(); + + return dst_part; +} + +std::pair cloneAndHandleHardlinksAndProjections( + MergeTreeData * merge_tree_data, + const DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + const MergeTreePartInfo & dst_part_info, + const String & tmp_part_prefix, + const ReadSettings & read_settings, + const WriteSettings & write_settings, + const IDataPartStorage::ClonePartParams & params) +{ + if (!doesStoragePolicyAllowSameDisk(merge_tree_data, src_part)) + throw Exception( + ErrorCodes::BAD_ARGUMENTS, + "Could not clone and load part {} because disk does not belong to storage policy", + quoteString(src_part->getDataPartStorage().getFullPath())); + + auto [destination_part, temporary_directory_lock] = cloneSourcePart( + merge_tree_data, src_part, metadata_snapshot, dst_part_info, tmp_part_prefix, read_settings, write_settings, params); + + if (!params.copy_instead_of_hardlink && params.hardlinked_files) + { + handleHardLinkedParameterFiles(src_part, params); + handleProjections(src_part, params); + } + + return std::make_pair(destination_part, std::move(temporary_directory_lock)); +} +} + +std::pair MergeTreeDataPartCloner::clone( + MergeTreeData * merge_tree_data, + const DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + const MergeTreePartInfo & dst_part_info, + const String & tmp_part_prefix, + bool require_part_metadata, + const IDataPartStorage::ClonePartParams & params, + const ReadSettings & read_settings, + const WriteSettings & write_settings) +{ + auto [destination_part, temporary_directory_lock] = cloneAndHandleHardlinksAndProjections( + merge_tree_data, src_part, metadata_snapshot, dst_part_info, tmp_part_prefix, read_settings, write_settings, params); + + return std::make_pair(finalizePart(destination_part, params, require_part_metadata), std::move(temporary_directory_lock)); +} + +std::pair MergeTreeDataPartCloner::cloneWithDistinctPartitionExpression( + MergeTreeData * merge_tree_data, + const DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + const MergeTreePartInfo & dst_part_info, + const String & tmp_part_prefix, + const ReadSettings & read_settings, + const WriteSettings & write_settings, + const MergeTreePartition & new_partition, + const IMergeTreeDataPart::MinMaxIndex & new_min_max_index, + bool sync_new_files, + const IDataPartStorage::ClonePartParams & params) +{ + auto [destination_part, temporary_directory_lock] = cloneAndHandleHardlinksAndProjections( + merge_tree_data, src_part, metadata_snapshot, dst_part_info, tmp_part_prefix, read_settings, write_settings, params); + + DistinctPartitionExpression::updateNewPartFiles( + *merge_tree_data, destination_part, new_partition, new_min_max_index, src_part->storage.getInMemoryMetadataPtr(), sync_new_files); + + return std::make_pair(finalizePart(destination_part, params, false), std::move(temporary_directory_lock)); +} + +} diff --git a/src/Storages/MergeTree/MergeTreeDataPartCloner.h b/src/Storages/MergeTree/MergeTreeDataPartCloner.h new file mode 100644 index 00000000000..53585f20b7f --- /dev/null +++ b/src/Storages/MergeTree/MergeTreeDataPartCloner.h @@ -0,0 +1,43 @@ +#pragma once + +namespace DB +{ + +struct StorageInMemoryMetadata; +using 
StorageMetadataPtr = std::shared_ptr; +struct MergeTreePartition; +class IMergeTreeDataPart; + +class MergeTreeDataPartCloner +{ +public: + using DataPart = IMergeTreeDataPart; + using MutableDataPartPtr = std::shared_ptr; + using DataPartPtr = std::shared_ptr; + + static std::pair clone( + MergeTreeData * merge_tree_data, + const DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + const MergeTreePartInfo & dst_part_info, + const String & tmp_part_prefix, + bool require_part_metadata, + const IDataPartStorage::ClonePartParams & params, + const ReadSettings & read_settings, + const WriteSettings & write_settings); + + static std::pair cloneWithDistinctPartitionExpression( + MergeTreeData * merge_tree_data, + const DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + const MergeTreePartInfo & dst_part_info, + const String & tmp_part_prefix, + const ReadSettings & read_settings, + const WriteSettings & write_settings, + const MergeTreePartition & new_partition, + const IMergeTreeDataPart::MinMaxIndex & new_min_max_index, + bool sync_new_files, + const IDataPartStorage::ClonePartParams & params); +}; + +} diff --git a/src/Storages/MergeTree/MergeTreePartition.cpp b/src/Storages/MergeTree/MergeTreePartition.cpp index ddeaf69136a..76ef3be25b3 100644 --- a/src/Storages/MergeTree/MergeTreePartition.cpp +++ b/src/Storages/MergeTree/MergeTreePartition.cpp @@ -467,6 +467,45 @@ void MergeTreePartition::create(const StorageMetadataPtr & metadata_snapshot, Bl } } +void MergeTreePartition::createAndValidateMinMaxPartitionIds( + const StorageMetadataPtr & metadata_snapshot, Block block_with_min_max_partition_ids, ContextPtr context) +{ + if (!metadata_snapshot->hasPartitionKey()) + return; + + auto partition_key_names_and_types = executePartitionByExpression(metadata_snapshot, block_with_min_max_partition_ids, context); + value.resize(partition_key_names_and_types.size()); + + /// Executing partition_by expression adds new columns to passed block according to partition functions. + /// The block is passed by reference and is used afterwards. `moduloLegacy` needs to be substituted back + /// with just `modulo`, because it was a temporary substitution. + static constexpr std::string_view modulo_legacy_function_name = "moduloLegacy"; + + size_t i = 0; + for (const auto & element : partition_key_names_and_types) + { + auto & partition_column = block_with_min_max_partition_ids.getByName(element.name); + + if (element.name.starts_with(modulo_legacy_function_name)) + partition_column.name.replace(0, modulo_legacy_function_name.size(), "modulo"); + + Field extracted_min_partition_id_field; + Field extracted_max_partition_id_field; + + partition_column.column->get(0, extracted_min_partition_id_field); + partition_column.column->get(1, extracted_max_partition_id_field); + + if (extracted_min_partition_id_field != extracted_max_partition_id_field) + { + throw Exception( + ErrorCodes::INVALID_PARTITION_VALUE, + "Can not create the partition. 
A partition can not contain values that have different partition ids"); + } + + partition_column.column->get(0u, value[i++]); + } +} + NamesAndTypesList MergeTreePartition::executePartitionByExpression(const StorageMetadataPtr & metadata_snapshot, Block & block, ContextPtr context) { auto adjusted_partition_key = adjustPartitionKey(metadata_snapshot, context); diff --git a/src/Storages/MergeTree/MergeTreePartition.h b/src/Storages/MergeTree/MergeTreePartition.h index 78b141f26ec..fd7ae02cde4 100644 --- a/src/Storages/MergeTree/MergeTreePartition.h +++ b/src/Storages/MergeTree/MergeTreePartition.h @@ -1,11 +1,12 @@ #pragma once -#include +#include #include #include #include #include -#include +#include +#include namespace DB { @@ -51,6 +52,11 @@ public: void create(const StorageMetadataPtr & metadata_snapshot, Block block, size_t row, ContextPtr context); + /// Copy of MergeTreePartition::create, but also validates if min max partition keys are equal. If they are different, + /// it means the partition can't be created because the data doesn't belong to the same partition. + void createAndValidateMinMaxPartitionIds( + const StorageMetadataPtr & metadata_snapshot, Block block_with_min_max_partition_ids, ContextPtr context); + static void appendFiles(const MergeTreeData & storage, Strings & files); /// Adjust partition key and execute its expression on block. Return sample block according to used expression. diff --git a/src/Storages/MergeTree/MergeTreePartitionCompatibilityVerifier.cpp b/src/Storages/MergeTree/MergeTreePartitionCompatibilityVerifier.cpp new file mode 100644 index 00000000000..21bcdb84a96 --- /dev/null +++ b/src/Storages/MergeTree/MergeTreePartitionCompatibilityVerifier.cpp @@ -0,0 +1,91 @@ +#include +#include +#include +#include +#include + +namespace DB +{ + +namespace ErrorCodes +{ +extern const int BAD_ARGUMENTS; +} + +namespace +{ +bool isDestinationPartitionExpressionMonotonicallyIncreasing( + const std::vector & hyperrectangle, const MergeTreeData & destination_storage) +{ + auto destination_table_metadata = destination_storage.getInMemoryMetadataPtr(); + + auto key_description = destination_table_metadata->getPartitionKey(); + auto definition_ast = key_description.definition_ast->clone(); + + auto table_identifier = std::make_shared(destination_storage.getStorageID().getTableName()); + auto table_with_columns + = TableWithColumnNamesAndTypes{DatabaseAndTableWithAlias(table_identifier), destination_table_metadata->getColumns().getOrdinary()}; + + auto expression_list = extractKeyExpressionList(definition_ast); + + MonotonicityCheckVisitor::Data data{{table_with_columns}, destination_storage.getContext(), /*group_by_function_hashes*/ {}}; + + for (auto i = 0u; i < expression_list->children.size(); i++) + { + data.range = hyperrectangle[i]; + + MonotonicityCheckVisitor(data).visit(expression_list->children[i]); + + if (!data.monotonicity.is_monotonic || !data.monotonicity.is_positive) + return false; + } + + return true; +} + +bool isExpressionDirectSubsetOf(const ASTPtr source, const ASTPtr destination) +{ + auto source_expression_list = extractKeyExpressionList(source); + auto destination_expression_list = extractKeyExpressionList(destination); + + std::unordered_set source_columns; + + for (auto i = 0u; i < source_expression_list->children.size(); ++i) + source_columns.insert(source_expression_list->children[i]->getColumnName()); + + for (auto i = 0u; i < destination_expression_list->children.size(); ++i) + if 
(!source_columns.contains(destination_expression_list->children[i]->getColumnName())) + return false; + + return true; +} +} + +void MergeTreePartitionCompatibilityVerifier::verify( + const MergeTreeData & source_storage, const MergeTreeData & destination_storage, const DataPartsVector & source_parts) +{ + const auto source_metadata = source_storage.getInMemoryMetadataPtr(); + const auto destination_metadata = destination_storage.getInMemoryMetadataPtr(); + + const auto source_partition_key_ast = source_metadata->getPartitionKeyAST(); + const auto destination_partition_key_ast = destination_metadata->getPartitionKeyAST(); + + // If destination partition expression columns are a subset of source partition expression columns, + // there is no need to check for monotonicity. + if (isExpressionDirectSubsetOf(source_partition_key_ast, destination_partition_key_ast)) + return; + + const auto src_global_min_max_indexes = MergeTreePartitionGlobalMinMaxIdxCalculator::calculate(source_parts, destination_storage); + + assert(!src_global_min_max_indexes.hyperrectangle.empty()); + + if (!isDestinationPartitionExpressionMonotonicallyIncreasing(src_global_min_max_indexes.hyperrectangle, destination_storage)) + throw DB::Exception(ErrorCodes::BAD_ARGUMENTS, "Destination table partition expression is not monotonically increasing"); + + MergeTreePartition().createAndValidateMinMaxPartitionIds( + destination_storage.getInMemoryMetadataPtr(), + src_global_min_max_indexes.getBlock(destination_storage), + destination_storage.getContext()); +} + +} diff --git a/src/Storages/MergeTree/MergeTreePartitionCompatibilityVerifier.h b/src/Storages/MergeTree/MergeTreePartitionCompatibilityVerifier.h new file mode 100644 index 00000000000..1682add3ebd --- /dev/null +++ b/src/Storages/MergeTree/MergeTreePartitionCompatibilityVerifier.h @@ -0,0 +1,30 @@ +#pragma once + +#include +#include + +namespace DB +{ + +/* + * Verifies that source and destination partitions are compatible. + * To be compatible, one of the following criteria must be met: + * 1. Destination partition expression columns are a subset of source partition columns; or + * 2. Destination partition expression is monotonic on the source global min_max idx range AND the computed partition id for + * the source global min_max idx range is the same. + * + * If not, an exception is thrown. 
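+ * + * Illustrative example (mirroring the tests added in this patch): if the source table is partitioned by + * toYYYYMMDD(timestamp) and the destination by toYYYYMM(timestamp), toYYYYMM is monotonically increasing over the + * source part's [min, max] timestamp range and both bounds map to the same destination partition id, so + * ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source is accepted. A non-monotonic destination + * expression, or one whose min/max bounds map to different destination partition ids, is rejected.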
+ * */ + +class MergeTreePartitionCompatibilityVerifier +{ +public: + using DataPart = IMergeTreeDataPart; + using DataPartPtr = std::shared_ptr; + using DataPartsVector = std::vector; + + static void + verify(const MergeTreeData & source_storage, const MergeTreeData & destination_storage, const DataPartsVector & source_parts); +}; + +} diff --git a/src/Storages/MergeTree/MergeTreePartitionGlobalMinMaxIdxCalculator.cpp b/src/Storages/MergeTree/MergeTreePartitionGlobalMinMaxIdxCalculator.cpp new file mode 100644 index 00000000000..0871efadf0c --- /dev/null +++ b/src/Storages/MergeTree/MergeTreePartitionGlobalMinMaxIdxCalculator.cpp @@ -0,0 +1,25 @@ +#include + +namespace DB +{ + +IMergeTreeDataPart::MinMaxIndex +MergeTreePartitionGlobalMinMaxIdxCalculator::calculate(const DataPartsVector & parts, const MergeTreeData & storage) +{ + IMergeTreeDataPart::MinMaxIndex global_min_max_indexes; + + for (const auto & part : parts) + { + auto metadata_manager = std::make_shared(part.get()); + + auto local_min_max_index = MergeTreeData::DataPart::MinMaxIndex(); + + local_min_max_index.load(storage, metadata_manager); + + global_min_max_indexes.merge(local_min_max_index); + } + + return global_min_max_indexes; +} + +} diff --git a/src/Storages/MergeTree/MergeTreePartitionGlobalMinMaxIdxCalculator.h b/src/Storages/MergeTree/MergeTreePartitionGlobalMinMaxIdxCalculator.h new file mode 100644 index 00000000000..4f271177246 --- /dev/null +++ b/src/Storages/MergeTree/MergeTreePartitionGlobalMinMaxIdxCalculator.h @@ -0,0 +1,24 @@ +#pragma once + +#include + +#include +#include + +namespace DB +{ + +/* + * Calculates global min max indexes for a given set of parts on given storage. + * */ +class MergeTreePartitionGlobalMinMaxIdxCalculator +{ + using DataPart = IMergeTreeDataPart; + using DataPartPtr = std::shared_ptr; + using DataPartsVector = std::vector; + +public: + static IMergeTreeDataPart::MinMaxIndex calculate(const DataPartsVector & parts, const MergeTreeData & storage); +}; + +} diff --git a/src/Storages/StorageMergeTree.cpp b/src/Storages/StorageMergeTree.cpp index 4761ccd8b58..fd5354a00a9 100644 --- a/src/Storages/StorageMergeTree.cpp +++ b/src/Storages/StorageMergeTree.cpp @@ -5,9 +5,9 @@ #include #include -#include #include #include +#include #include "Common/Exception.h" #include #include @@ -20,25 +20,30 @@ #include #include #include +#include #include -#include #include #include #include #include #include -#include #include +#include +#include #include #include #include -#include -#include -#include -#include -#include #include +#include +#include +#include +#include +#include +#include #include +#include +#include +#include #include #include #include @@ -2039,41 +2044,73 @@ void StorageMergeTree::replacePartitionFrom(const StoragePtr & source_table, con ProfileEventsScope profile_events_scope; MergeTreeData & src_data = checkStructureAndGetMergeTreeData(source_table, source_metadata_snapshot, my_metadata_snapshot); - String partition_id = getPartitionIDFromQuery(partition, local_context); + String partition_id = src_data.getPartitionIDFromQuery(partition, local_context); DataPartsVector src_parts = src_data.getVisibleDataPartsVectorInPartition(local_context, partition_id); + + bool attach_empty_partition = !replace && src_parts.empty(); + if (attach_empty_partition) + return; + MutableDataPartsVector dst_parts; std::vector dst_parts_locks; static const String TMP_PREFIX = "tmp_replace_from_"; - for (const DataPartPtr & src_part : src_parts) + const auto my_partition_expression = 
my_metadata_snapshot->getPartitionKeyAST(); + const auto src_partition_expression = source_metadata_snapshot->getPartitionKeyAST(); + const auto is_partition_exp_different = queryToStringNullable(my_partition_expression) != queryToStringNullable(src_partition_expression); + + if (is_partition_exp_different && !src_parts.empty()) + MergeTreePartitionCompatibilityVerifier::verify(src_data, /* destination_storage */ *this, src_parts); + + for (DataPartPtr & src_part : src_parts) { if (!canReplacePartition(src_part)) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Cannot replace partition '{}' because part '{}' has inconsistent granularity with table", partition_id, src_part->name); - /// This will generate unique name in scope of current server process. - Int64 temp_index = insert_increment.get(); - MergeTreePartInfo dst_part_info(partition_id, temp_index, temp_index, src_part->info.level); - IDataPartStorage::ClonePartParams clone_params{.txn = local_context->getCurrentTransaction()}; - auto [dst_part, part_lock] = cloneAndLoadDataPartOnSameDisk( - src_part, - TMP_PREFIX, - dst_part_info, - my_metadata_snapshot, - clone_params, - local_context->getReadSettings(), - local_context->getWriteSettings()); - dst_parts.emplace_back(std::move(dst_part)); - dst_parts_locks.emplace_back(std::move(part_lock)); - } + /// This will generate unique name in scope of current server process. + auto index = insert_increment.get(); - /// ATTACH empty part set - if (!replace && dst_parts.empty()) - return; + if (is_partition_exp_different) + { + auto [new_partition, new_min_max_index] = createPartitionAndMinMaxIndexFromSourcePart( + src_part, my_metadata_snapshot, local_context); + + auto [dst_part, part_lock] = cloneAndLoadPartOnSameDiskWithDifferentPartitionKey( + src_part, + new_partition, + new_partition.getID(*this), + new_min_max_index, + TMP_PREFIX, + my_metadata_snapshot, + clone_params, + local_context, + index, + index); + + dst_parts.emplace_back(std::move(dst_part)); + dst_parts_locks.emplace_back(std::move(part_lock)); + } + else + { + MergeTreePartInfo dst_part_info(partition_id, index, index, src_part->info.level); + + auto [dst_part, part_lock] = cloneAndLoadDataPartOnSameDisk( + src_part, + TMP_PREFIX, + dst_part_info, + my_metadata_snapshot, + clone_params, + local_context->getReadSettings(), + local_context->getWriteSettings()); + dst_parts.emplace_back(std::move(dst_part)); + dst_parts_locks.emplace_back(std::move(part_lock)); + } + } MergeTreePartInfo drop_range; if (replace) diff --git a/src/Storages/StorageReplicatedMergeTree.cpp b/src/Storages/StorageReplicatedMergeTree.cpp index f7e6783dbc2..512811e39d7 100644 --- a/src/Storages/StorageReplicatedMergeTree.cpp +++ b/src/Storages/StorageReplicatedMergeTree.cpp @@ -26,22 +26,21 @@ #include -#include #include #include #include #include #include -#include #include #include -#include #include #include #include #include #include +#include #include +#include #include #include #include @@ -53,9 +52,11 @@ #include #include #include +#include #include #include #include +#include #include #include @@ -2713,16 +2714,48 @@ bool StorageReplicatedMergeTree::executeReplaceRange(LogEntry & entry) .copy_instead_of_hardlink = storage_settings_ptr->always_use_copy_instead_of_hardlinks || ((our_zero_copy_enabled || source_zero_copy_enabled) && part_desc->src_table_part->isStoredOnRemoteDiskWithZeroCopySupport()), .metadata_version_to_write = metadata_snapshot->getMetadataVersion() }; - auto [res_part, temporary_part_lock] = cloneAndLoadDataPartOnSameDisk( - 
part_desc->src_table_part, - TMP_PREFIX + "clone_", - part_desc->new_part_info, - metadata_snapshot, - clone_params, - getContext()->getReadSettings(), - getContext()->getWriteSettings()); - part_desc->res_part = std::move(res_part); - part_desc->temporary_part_lock = std::move(temporary_part_lock); + + const auto my_partition_expression = metadata_snapshot->getPartitionKeyAST(); + const auto src_partition_expression = source_table->getInMemoryMetadataPtr()->getPartitionKeyAST(); + + const auto is_partition_exp_different = queryToStringNullable(my_partition_expression) != queryToStringNullable(src_partition_expression); + + if (is_partition_exp_different) + { + auto [new_partition, new_min_max_index] = createPartitionAndMinMaxIndexFromSourcePart( + part_desc->src_table_part, metadata_snapshot, getContext()); + + auto partition_id = new_partition.getID(*this); + + auto [res_part, temporary_part_lock] = cloneAndLoadPartOnSameDiskWithDifferentPartitionKey( + part_desc->src_table_part, + new_partition, + partition_id, + new_min_max_index, + TMP_PREFIX + "clone_", + metadata_snapshot, + clone_params, + getContext(), + part_desc->new_part_info.min_block, + part_desc->new_part_info.max_block); + + part_desc->res_part = std::move(res_part); + part_desc->temporary_part_lock = std::move(temporary_part_lock); + } + else + { + auto [res_part, temporary_part_lock] = cloneAndLoadDataPartOnSameDisk( + part_desc->src_table_part, + TMP_PREFIX + "clone_", + part_desc->new_part_info, + metadata_snapshot, + clone_params, + getContext()->getReadSettings(), + getContext()->getWriteSettings()); + + part_desc->res_part = std::move(res_part); + part_desc->temporary_part_lock = std::move(temporary_part_lock); + } } else if (!part_desc->replica.empty()) { @@ -7852,11 +7885,22 @@ void StorageReplicatedMergeTree::replacePartitionFrom( ProfileEventsScope profile_events_scope; MergeTreeData & src_data = checkStructureAndGetMergeTreeData(source_table, source_metadata_snapshot, metadata_snapshot); - String partition_id = getPartitionIDFromQuery(partition, query_context); + String partition_id = src_data.getPartitionIDFromQuery(partition, query_context); /// NOTE: Some covered parts may be missing in src_all_parts if corresponding log entries are not executed yet. 
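+    /// The partition id above is resolved against the source table, because source and destination partition expressions +    /// may differ; when they do, each part's destination partition and min/max index are recomputed before cloning (see below).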
DataPartsVector src_all_parts = src_data.getVisibleDataPartsVectorInPartition(query_context, partition_id); + bool attach_empty_partition = !replace && src_all_parts.empty(); + if (attach_empty_partition) + return; + + const auto my_partition_expression = metadata_snapshot->getPartitionKeyAST(); + const auto src_partition_expression = source_metadata_snapshot->getPartitionKeyAST(); + const auto is_partition_exp_different = queryToStringNullable(my_partition_expression) != queryToStringNullable(src_partition_expression); + + if (is_partition_exp_different && !src_all_parts.empty()) + MergeTreePartitionCompatibilityVerifier::verify(src_data, /* destination_storage */ *this, src_all_parts); + LOG_DEBUG(log, "Cloning {} parts", src_all_parts.size()); static const String TMP_PREFIX = "tmp_replace_from_"; @@ -7911,6 +7955,18 @@ void StorageReplicatedMergeTree::replacePartitionFrom( "Cannot replace partition '{}' because part '{}" "' has inconsistent granularity with table", partition_id, src_part->name); + IMergeTreeDataPart::MinMaxIndex min_max_index = *src_part->minmax_idx; + MergeTreePartition merge_tree_partition = src_part->partition; + + if (is_partition_exp_different) + { + auto [new_partition, new_min_max_index] = createPartitionAndMinMaxIndexFromSourcePart(src_part, metadata_snapshot, query_context); + + merge_tree_partition = new_partition; + min_max_index = new_min_max_index; + partition_id = merge_tree_partition.getID(*this); + } + String hash_hex = src_part->checksums.getTotalChecksumHex(); const bool is_duplicated_part = replaced_parts.contains(hash_hex); replaced_parts.insert(hash_hex); @@ -7929,27 +7985,52 @@ void StorageReplicatedMergeTree::replacePartitionFrom( continue; } - UInt64 index = lock->getNumber(); - MergeTreePartInfo dst_part_info(partition_id, index, index, src_part->info.level); - bool zero_copy_enabled = storage_settings_ptr->allow_remote_fs_zero_copy_replication || dynamic_cast(source_table.get())->getSettings()->allow_remote_fs_zero_copy_replication; + + UInt64 index = lock->getNumber(); + IDataPartStorage::ClonePartParams clone_params { .copy_instead_of_hardlink = storage_settings_ptr->always_use_copy_instead_of_hardlinks || (zero_copy_enabled && src_part->isStoredOnRemoteDiskWithZeroCopySupport()), .metadata_version_to_write = metadata_snapshot->getMetadataVersion() }; - auto [dst_part, part_lock] = cloneAndLoadDataPartOnSameDisk( - src_part, - TMP_PREFIX, - dst_part_info, - metadata_snapshot, - clone_params, - query_context->getReadSettings(), - query_context->getWriteSettings()); + + if (is_partition_exp_different) + { + auto [dst_part, part_lock] = cloneAndLoadPartOnSameDiskWithDifferentPartitionKey( + src_part, + merge_tree_partition, + partition_id, + min_max_index, + TMP_PREFIX, + metadata_snapshot, + clone_params, + query_context, + index, + index); + + dst_parts.emplace_back(dst_part); + dst_parts_locks.emplace_back(std::move(part_lock)); + } + else + { + MergeTreePartInfo dst_part_info(partition_id, index, index, src_part->info.level); + + auto [dst_part, part_lock] = cloneAndLoadDataPartOnSameDisk( + src_part, + TMP_PREFIX, + dst_part_info, + metadata_snapshot, + clone_params, + query_context->getReadSettings(), + query_context->getWriteSettings()); + + dst_parts.emplace_back(dst_part); + dst_parts_locks.emplace_back(std::move(part_lock)); + } + src_parts.emplace_back(src_part); - dst_parts.emplace_back(dst_part); - dst_parts_locks.emplace_back(std::move(part_lock)); ephemeral_locks.emplace_back(std::move(*lock)); 
block_id_paths.emplace_back(block_id_path); part_checksums.emplace_back(hash_hex); diff --git a/tests/integration/test_attach_partition_distinct_expression_replicated/__init__.py b/tests/integration/test_attach_partition_distinct_expression_replicated/__init__.py new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/integration/test_attach_partition_distinct_expression_replicated/configs/remote_servers.xml b/tests/integration/test_attach_partition_distinct_expression_replicated/configs/remote_servers.xml new file mode 100644 index 00000000000..b40730e9f7d --- /dev/null +++ b/tests/integration/test_attach_partition_distinct_expression_replicated/configs/remote_servers.xml @@ -0,0 +1,17 @@ + + + + + true + + replica1 + 9000 + + + replica2 + 9000 + + + + + diff --git a/tests/integration/test_attach_partition_distinct_expression_replicated/test.py b/tests/integration/test_attach_partition_distinct_expression_replicated/test.py new file mode 100644 index 00000000000..1d8ac4e9e37 --- /dev/null +++ b/tests/integration/test_attach_partition_distinct_expression_replicated/test.py @@ -0,0 +1,214 @@ +import pytest +from helpers.cluster import ClickHouseCluster +from helpers.test_tools import assert_eq_with_retry + +cluster = ClickHouseCluster(__file__) + +replica1 = cluster.add_instance( + "replica1", with_zookeeper=True, main_configs=["configs/remote_servers.xml"] +) +replica2 = cluster.add_instance( + "replica2", with_zookeeper=True, main_configs=["configs/remote_servers.xml"] +) + + +@pytest.fixture(scope="module") +def start_cluster(): + try: + cluster.start() + yield cluster + except Exception as ex: + print(ex) + finally: + cluster.shutdown() + + +def cleanup(nodes): + for node in nodes: + node.query("DROP TABLE IF EXISTS source SYNC") + node.query("DROP TABLE IF EXISTS destination SYNC") + + +def create_table(node, table_name, replicated): + replica = node.name + engine = ( + f"ReplicatedMergeTree('/clickhouse/tables/1/{table_name}', '{replica}')" + if replicated + else "MergeTree()" + ) + partition_expression = ( + "toYYYYMMDD(timestamp)" if table_name == "source" else "toYYYYMM(timestamp)" + ) + node.query_with_retry( + """ + CREATE TABLE {table_name}(timestamp DateTime) + ENGINE = {engine} + ORDER BY tuple() PARTITION BY {partition_expression} + SETTINGS cleanup_delay_period=1, cleanup_delay_period_random_add=1, max_cleanup_delay_period=1; + """.format( + table_name=table_name, + engine=engine, + partition_expression=partition_expression, + ) + ) + + +def test_both_replicated(start_cluster): + for node in [replica1, replica2]: + create_table(node, "source", True) + create_table(node, "destination", True) + + replica1.query("INSERT INTO source VALUES ('2010-03-02 02:01:01')") + replica1.query("SYSTEM SYNC REPLICA source") + replica1.query("SYSTEM SYNC REPLICA destination") + replica1.query( + f"ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source" + ) + + assert_eq_with_retry( + replica1, f"SELECT * FROM destination", "2010-03-02 02:01:01\n" + ) + assert_eq_with_retry( + replica1, + f"SELECT * FROM destination", + replica2.query(f"SELECT * FROM destination"), + ) + + cleanup([replica1, replica2]) + + +def test_only_destination_replicated(start_cluster): + create_table(replica1, "source", False) + create_table(replica1, "destination", True) + create_table(replica2, "destination", True) + + replica1.query("INSERT INTO source VALUES ('2010-03-02 02:01:01')") + replica1.query("SYSTEM SYNC REPLICA destination") + replica1.query( + f"ALTER TABLE destination ATTACH 
PARTITION ID '20100302' FROM source" + ) + + assert_eq_with_retry( + replica1, f"SELECT * FROM destination", "2010-03-02 02:01:01\n" + ) + assert_eq_with_retry( + replica1, + f"SELECT * FROM destination", + replica2.query(f"SELECT * FROM destination"), + ) + + cleanup([replica1, replica2]) + + +def test_both_replicated_partitioned_to_unpartitioned(start_cluster): + def create_tables(nodes): + for node in nodes: + source_engine = ( + f"ReplicatedMergeTree('/clickhouse/tables/1/source', '{node.name}')" + ) + node.query( + """ + CREATE TABLE source(timestamp DateTime) + ENGINE = {engine} + ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp) + SETTINGS cleanup_delay_period=1, cleanup_delay_period_random_add=1, max_cleanup_delay_period=1; + """.format( + engine=source_engine, + ) + ) + + destination_engine = f"ReplicatedMergeTree('/clickhouse/tables/1/destination', '{node.name}')" + node.query( + """ + CREATE TABLE destination(timestamp DateTime) + ENGINE = {engine} + ORDER BY tuple() PARTITION BY tuple() + SETTINGS cleanup_delay_period=1, cleanup_delay_period_random_add=1, max_cleanup_delay_period=1; + """.format( + engine=destination_engine, + ) + ) + + create_tables([replica1, replica2]) + + replica1.query("INSERT INTO source VALUES ('2010-03-02 02:01:01')") + replica1.query("INSERT INTO source VALUES ('2010-03-03 02:01:01')") + replica1.query("SYSTEM SYNC REPLICA source") + replica1.query("SYSTEM SYNC REPLICA destination") + + replica1.query( + f"ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source" + ) + replica1.query( + f"ALTER TABLE destination ATTACH PARTITION ID '20100303' FROM source" + ) + + assert_eq_with_retry( + replica1, + f"SELECT * FROM destination ORDER BY timestamp", + "2010-03-02 02:01:01\n2010-03-03 02:01:01\n", + ) + assert_eq_with_retry( + replica1, + f"SELECT * FROM destination ORDER BY timestamp", + replica2.query(f"SELECT * FROM destination ORDER BY timestamp"), + ) + + cleanup([replica1, replica2]) + + +def test_both_replicated_different_exp_same_id(start_cluster): + def create_tables(nodes): + for node in nodes: + source_engine = ( + f"ReplicatedMergeTree('/clickhouse/tables/1/source', '{node.name}')" + ) + node.query( + """ + CREATE TABLE source(a UInt16,b UInt16,c UInt16,extra UInt64,Path String,Time DateTime,Value Float64,Timestamp Int64,sign Int8) + ENGINE = {engine} + ORDER BY tuple() PARTITION BY a % 3 + SETTINGS cleanup_delay_period=1, cleanup_delay_period_random_add=1, max_cleanup_delay_period=1; + """.format( + engine=source_engine, + ) + ) + + destination_engine = f"ReplicatedMergeTree('/clickhouse/tables/1/destination', '{node.name}')" + node.query( + """ + CREATE TABLE destination(a UInt16,b UInt16,c UInt16,extra UInt64,Path String,Time DateTime,Value Float64,Timestamp Int64,sign Int8) + ENGINE = {engine} + ORDER BY tuple() PARTITION BY a + SETTINGS cleanup_delay_period=1, cleanup_delay_period_random_add=1, max_cleanup_delay_period=1; + """.format( + engine=destination_engine, + ) + ) + + create_tables([replica1, replica2]) + + replica1.query( + "INSERT INTO source (a, b, c, extra, sign) VALUES (1, 5, 9, 1000, 1)" + ) + replica1.query( + "INSERT INTO source (a, b, c, extra, sign) VALUES (2, 6, 10, 1000, 1)" + ) + replica1.query("SYSTEM SYNC REPLICA source") + replica1.query("SYSTEM SYNC REPLICA destination") + + replica1.query(f"ALTER TABLE destination ATTACH PARTITION 1 FROM source") + replica1.query(f"ALTER TABLE destination ATTACH PARTITION 2 FROM source") + + assert_eq_with_retry( + replica1, + f"SELECT * FROM destination ORDER BY a", + 
"1\t5\t9\t1000\t\t1970-01-01 00:00:00\t0\t0\t1\n2\t6\t10\t1000\t\t1970-01-01 00:00:00\t0\t0\t1\n", + ) + assert_eq_with_retry( + replica1, + f"SELECT * FROM destination ORDER BY a", + replica2.query(f"SELECT * FROM destination ORDER BY a"), + ) + + cleanup([replica1, replica2]) diff --git a/tests/queries/0_stateless/02456_test_attach_partition_different_partition_exp.reference b/tests/queries/0_stateless/02456_test_attach_partition_different_partition_exp.reference new file mode 100644 index 00000000000..f1d036b08bf --- /dev/null +++ b/tests/queries/0_stateless/02456_test_attach_partition_different_partition_exp.reference @@ -0,0 +1,467 @@ +-- { echoOn } +-- Should be allowed since destination partition expr is monotonically increasing and compatible +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); +ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +201003 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '20100302' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +201003 +-- Should be allowed since destination partition expr is monotonically increasing and compatible. Note that even though +-- the destination partition expression is more granular, the data would still fall in the same partition. 
Thus, it is valid +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp); +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); +ALTER TABLE destination ATTACH PARTITION ID '201003' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +20100302 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '201003' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +20100302 +-- Should be allowed since destination partition expr is monotonically increasing and compatible for those specific values +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime, A Int64) engine=MergeTree ORDER BY timestamp PARTITION BY intDiv(A, 6); +CREATE TABLE destination (timestamp DateTime, A Int64) engine=MergeTree ORDER BY timestamp PARTITION BY A; +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01', 1), ('2010-03-02 02:01:03', 1); +ALTER TABLE destination ATTACH PARTITION ID '0' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 1 +2010-03-02 02:01:03 1 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 1 +2010-03-02 02:01:03 1 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +1 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION 0 FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 1 +2010-03-02 02:01:03 1 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 1 +2010-03-02 02:01:03 1 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +1 +-- Should be allowed because dst partition exp is monot inc and data is not split +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY cityHash64(category); +CREATE TABLE destination (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY toString(category); +INSERT INTO TABLE source VALUES ('spaghetti', 'food'), ('mop', 'general'); +INSERT INTO TABLE source VALUES ('rice', 'food'); +ALTER TABLE destination ATTACH PARTITION ID '17908065610379824077' from source; +SELECT * FROM source ORDER BY productName; +mop general +rice food +spaghetti food +SELECT * FROM destination ORDER BY productName; +rice food +spaghetti food +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +59532f3c39a412a413f0f014c7750a9d +59532f3c39a412a413f0f014c7750a9d +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '17908065610379824077' from source; +SELECT * FROM source ORDER BY productName; +mop general +rice food +spaghetti food +SELECT * FROM 
destination ORDER BY productName; +rice food +spaghetti food +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +59532f3c39a412a413f0f014c7750a9d +59532f3c39a412a413f0f014c7750a9d +-- Should be allowed, extra test case to validate https://github.com/ClickHouse/ClickHouse/pull/39507#issuecomment-1747574133 + +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp Int64) engine=MergeTree ORDER BY (timestamp) PARTITION BY intDiv(timestamp, 86400000); +CREATE TABLE destination (timestamp Int64) engine=MergeTree ORDER BY (timestamp) PARTITION BY toYear(toDateTime(intDiv(timestamp, 1000))); +INSERT INTO TABLE source VALUES (1267495261123); +ALTER TABLE destination ATTACH PARTITION ID '14670' FROM source; +SELECT * FROM source ORDER BY timestamp; +1267495261123 +SELECT * FROM destination ORDER BY timestamp; +1267495261123 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +2010 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '14670' from source; +SELECT * FROM source ORDER BY timestamp; +1267495261123 +SELECT * FROM destination ORDER BY timestamp; +1267495261123 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +2010 +-- Should be allowed, extra test case to validate https://github.com/ClickHouse/ClickHouse/pull/39507#issuecomment-1747511726 + +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime('UTC'), key Int64, f Float64) engine=MergeTree ORDER BY (key, timestamp) PARTITION BY toYear(timestamp); +CREATE TABLE destination (timestamp DateTime('UTC'), key Int64, f Float64) engine=MergeTree ORDER BY (key, timestamp) PARTITION BY (intDiv(toUInt32(timestamp),86400)); +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01',1,1),('2010-03-02 02:01:01',1,1),('2011-02-02 02:01:03',1,1); +ALTER TABLE destination ATTACH PARTITION ID '2010' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 1 1 +2010-03-02 02:01:01 1 1 +2011-02-02 02:01:03 1 1 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 1 1 +2010-03-02 02:01:01 1 1 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +14670 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '2010' from source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 1 1 +2010-03-02 02:01:01 1 1 +2011-02-02 02:01:03 1 1 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 1 1 +2010-03-02 02:01:01 1 1 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +14670 +-- Should be allowed, partitioned table to unpartitioned. Since the destination is unpartitioned, parts would ultimately +-- fall into the same partition. +-- Destination partition by expression is omitted, which causes StorageMetadata::getPartitionKeyAST() to be nullptr. 
+DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple(); +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); +ALTER TABLE destination ATTACH PARTITION ID '201003' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +all +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '201003' from source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +all +-- Same as above, but destination partition by expression is explicitly defined. Test case required to validate that +-- partition by tuple() is accepted. +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY tuple(); +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); +ALTER TABLE destination ATTACH PARTITION ID '201003' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +all +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '201003' from source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +all +-- Should be allowed because the destination partition expression columns are a subset of the source partition expression columns +-- Columns in this case refer to the expression elements, not to the actual table columns +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (a Int, b Int, c Int) engine=MergeTree ORDER BY tuple() PARTITION BY (a, b, c); +CREATE TABLE destination (a Int, b Int, c Int) engine=MergeTree ORDER BY tuple() PARTITION BY (a, b); +INSERT INTO TABLE source VALUES (1, 2, 3), (1, 2, 4); +ALTER TABLE destination ATTACH PARTITION ID '1-2-3' FROM source; +SELECT * FROM source ORDER BY (a, b, c); +1 2 3 +1 2 4 +SELECT * FROM destination ORDER BY (a, b, c); +1 2 3 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +1-2 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION (1, 2, 3) from source; +SELECT * FROM source ORDER BY (a, b, c); +1 2 3 +1 2 4 +SELECT * FROM destination ORDER BY (a, b, c); +1 2 3 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +1-2 +-- Should be allowed because the destination 
partition expression columns are a subset of the source partition expression columns +-- Columns in this case refer to the expression elements, not to the actual table columns +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (a Int, b Int, c Int) engine=MergeTree ORDER BY tuple() PARTITION BY (a, b, c); +CREATE TABLE destination (a Int, b Int, c Int) engine=MergeTree ORDER BY tuple() PARTITION BY a; +INSERT INTO TABLE source VALUES (1, 2, 3), (1, 2, 4); +ALTER TABLE destination ATTACH PARTITION ID '1-2-3' FROM source; +SELECT * FROM source ORDER BY (a, b, c); +1 2 3 +1 2 4 +SELECT * FROM destination ORDER BY (a, b, c); +1 2 3 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +1 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION (1, 2, 3) from source; +SELECT * FROM source ORDER BY (a, b, c); +1 2 3 +1 2 4 +SELECT * FROM destination ORDER BY (a, b, c); +1 2 3 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +1 +-- Should be allowed. Special test case, tricky to explain. First column of source partition expression is +-- timestamp, while first column of destination partition expression is `A`. One of the previous implementations +-- would not match the columns, which could lead to `timestamp` min max being used to calculate monotonicity of `A`. +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (`timestamp` DateTime, `A` Int64) ENGINE = MergeTree PARTITION BY tuple(toYYYYMM(timestamp), intDiv(A, 6)) ORDER BY timestamp; +CREATE TABLE destination (`timestamp` DateTime, `A` Int64) ENGINE = MergeTree PARTITION BY A ORDER BY timestamp; +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01', 5); +ALTER TABLE destination ATTACH PARTITION ID '201003-0' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 5 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 5 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +5 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION (201003, 0) from source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 5 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 5 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +5 +-- Should be allowed. Destination partition expression contains multiple expressions, but all of them are monotonically +-- increasing in the source partition min max indexes. 
+DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (A Int, B Int) ENGINE = MergeTree PARTITION BY tuple(A, B) ORDER BY tuple(); +CREATE TABLE destination (A Int, B Int) ENGINE = MergeTree PARTITION BY tuple(intDiv(A, 2), intDiv(B, 2)) ORDER BY tuple(); +INSERT INTO TABLE source VALUES (6, 12); +ALTER TABLE destination ATTACH PARTITION ID '6-12' FROM source; +SELECT * FROM source ORDER BY A; +6 12 +SELECT * FROM destination ORDER BY A; +6 12 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +3-6 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION (6, 12) from source; +SELECT * FROM source ORDER BY A; +6 12 +SELECT * FROM destination ORDER BY A; +6 12 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +3-6 +-- Should be allowed. The same scenario as above, but partition expressions inverted. +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (A Int, B Int) ENGINE = MergeTree PARTITION BY tuple(intDiv(A, 2), intDiv(B, 2)) ORDER BY tuple(); +CREATE TABLE destination (A Int, B Int) ENGINE = MergeTree PARTITION BY tuple(A, B) ORDER BY tuple(); +INSERT INTO TABLE source VALUES (6, 12); +ALTER TABLE destination ATTACH PARTITION ID '3-6' FROM source; +SELECT * FROM source ORDER BY A; +6 12 +SELECT * FROM destination ORDER BY A; +6 12 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +6-12 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION (3, 6) from source; +SELECT * FROM source ORDER BY A; +6 12 +SELECT * FROM destination ORDER BY A; +6 12 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +6-12 +-- Should be allowed, it is a local operation, no different than regular attach. Replicated to replicated. +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE + source(timestamp DateTime) + ENGINE = ReplicatedMergeTree('/clickhouse/tables/{database}/test/source_replicated_to_replicated_distinct_expression', '1') + PARTITION BY toYYYYMMDD(timestamp) + ORDER BY tuple(); +CREATE TABLE + destination(timestamp DateTime) + ENGINE = ReplicatedMergeTree('/clickhouse/tables/{database}/test/destination_replicated_to_replicated_distinct_expression', '1') + PARTITION BY toYYYYMM(timestamp) + ORDER BY tuple(); +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); +ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +201003 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '20100302' from source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +201003 +-- Should be allowed, it is a local operation, no different than regular attach. 
Non replicated to replicated +DROP TABLE IF EXISTS source SYNC; +DROP TABLE IF EXISTS destination SYNC; +CREATE TABLE source(timestamp DateTime) ENGINE = MergeTree() PARTITION BY toYYYYMMDD(timestamp) ORDER BY tuple(); +CREATE TABLE + destination(timestamp DateTime) + ENGINE = ReplicatedMergeTree('/clickhouse/tables/{database}/test/destination_non_replicated_to_replicated_distinct_expression', '1') + PARTITION BY toYYYYMM(timestamp) + ORDER BY tuple(); +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); +ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +201003 +TRUNCATE TABLE destination; +ALTER TABLE destination ATTACH PARTITION '20100302' from source; +SELECT * FROM source ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT * FROM destination ORDER BY timestamp; +2010-03-02 02:01:01 +2010-03-02 02:01:03 +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +201003 +-- Should not be allowed because data would be split into two different partitions +DROP TABLE IF EXISTS source SYNC; +DROP TABLE IF EXISTS destination SYNC; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp); +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-03 02:01:03'); +ALTER TABLE destination ATTACH PARTITION ID '201003' FROM source; -- { serverError 248 } +ALTER TABLE destination ATTACH PARTITION '201003' from source; -- { serverError 248 } +-- Should not be allowed because data would be split into two different partitions +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime, A Int64) engine=MergeTree ORDER BY timestamp PARTITION BY intDiv(A, 6); +CREATE TABLE destination (timestamp DateTime, A Int64) engine=MergeTree ORDER BY timestamp PARTITION BY A; +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01', 1), ('2010-03-02 02:01:03', 2); +ALTER TABLE destination ATTACH PARTITION ID '0' FROM source; -- { serverError 248 } +ALTER TABLE destination ATTACH PARTITION 0 FROM source; -- { serverError 248 } +-- Should not be allowed because dst partition exp takes more than two arguments, so it's not considered monotonically inc +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY toString(category); +CREATE TABLE destination (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY substring(category, 1, 2); +INSERT INTO TABLE source VALUES ('spaghetti', 'food'), ('mop', 'general'); +INSERT INTO TABLE source VALUES ('rice', 'food'); +ALTER TABLE destination ATTACH PARTITION ID '4590ba78048910b74a47d5bfb308abed' from source; -- { serverError 36 } +ALTER TABLE destination ATTACH PARTITION 'food' from source; -- { serverError 36 } +-- Should not be allowed because dst partition exp depends on a different set of columns +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (productName String, category 
String) engine=MergeTree ORDER BY tuple() PARTITION BY toString(category); +CREATE TABLE destination (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY toString(productName); +INSERT INTO TABLE source VALUES ('spaghetti', 'food'), ('mop', 'general'); +INSERT INTO TABLE source VALUES ('rice', 'food'); +ALTER TABLE destination ATTACH PARTITION ID '4590ba78048910b74a47d5bfb308abed' from source; -- { serverError 36 } +ALTER TABLE destination ATTACH PARTITION 'food' from source; -- { serverError 36 } +-- Should not be allowed because dst partition exp is not monotonically increasing +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (productName String) engine=MergeTree ORDER BY tuple() PARTITION BY left(productName, 2); +CREATE TABLE destination (productName String) engine=MergeTree ORDER BY tuple() PARTITION BY cityHash64(productName); +INSERT INTO TABLE source VALUES ('bread'), ('mop'); +INSERT INTO TABLE source VALUES ('broccoli'); +ALTER TABLE destination ATTACH PARTITION ID '4589453b7ee96ce9de1265bd57674496' from source; -- { serverError 36 } +ALTER TABLE destination ATTACH PARTITION 'br' from source; -- { serverError 36 } +-- Empty/ non-existent partition, same partition expression. Nothing should happen +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +ALTER TABLE destination ATTACH PARTITION ID '1' FROM source; +ALTER TABLE destination ATTACH PARTITION 1 FROM source; +SELECT * FROM destination; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +-- Empty/ non-existent partition, different partition expression. Nothing should happen +-- https://github.com/ClickHouse/ClickHouse/pull/39507#discussion_r1399839045 +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +ALTER TABLE destination ATTACH PARTITION ID '1' FROM source; +ALTER TABLE destination ATTACH PARTITION 1 FROM source; +SELECT * FROM destination; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +-- Replace instead of attach. Empty/ non-existent partition, same partition expression. Nothing should happen +-- https://github.com/ClickHouse/ClickHouse/pull/39507#discussion_r1399839045 +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +ALTER TABLE destination REPLACE PARTITION '1' FROM source; +SELECT * FROM destination; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; +-- Replace instead of attach. Empty/ non-existent partition to non-empty partition, same partition id. 
+-- https://github.com/ClickHouse/ClickHouse/pull/39507#discussion_r1399839045 +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (A Int) engine=MergeTree ORDER BY tuple() PARTITION BY A; +CREATE TABLE destination (A Int) engine=MergeTree ORDER BY tuple() PARTITION BY A; +INSERT INTO TABLE destination VALUES (1); +ALTER TABLE destination REPLACE PARTITION '1' FROM source; +SELECT * FROM destination; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; diff --git a/tests/queries/0_stateless/02456_test_attach_partition_different_partition_exp.sql b/tests/queries/0_stateless/02456_test_attach_partition_different_partition_exp.sql new file mode 100644 index 00000000000..9547d6ae249 --- /dev/null +++ b/tests/queries/0_stateless/02456_test_attach_partition_different_partition_exp.sql @@ -0,0 +1,485 @@ +-- { echoOn } +-- Should be allowed since destination partition expr is monotonically increasing and compatible +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); + +ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '20100302' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed since destination partition expr is monotonically increasing and compatible. Note that even though +-- the destination partition expression is more granular, the data would still fall in the same partition. 
Thus, it is valid +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp); + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); + +ALTER TABLE destination ATTACH PARTITION ID '201003' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '201003' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed since destination partition expr is monotonically increasing and compatible for those specific values +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp DateTime, A Int64) engine=MergeTree ORDER BY timestamp PARTITION BY intDiv(A, 6); + +CREATE TABLE destination (timestamp DateTime, A Int64) engine=MergeTree ORDER BY timestamp PARTITION BY A; + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01', 1), ('2010-03-02 02:01:03', 1); + +ALTER TABLE destination ATTACH PARTITION ID '0' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION 0 FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed because dst partition exp is monot inc and data is not split +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY cityHash64(category); +CREATE TABLE destination (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY toString(category); + +INSERT INTO TABLE source VALUES ('spaghetti', 'food'), ('mop', 'general'); +INSERT INTO TABLE source VALUES ('rice', 'food'); + +ALTER TABLE destination ATTACH PARTITION ID '17908065610379824077' from source; + +SELECT * FROM source ORDER BY productName; +SELECT * FROM destination ORDER BY productName; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '17908065610379824077' from source; + +SELECT * FROM source ORDER BY productName; +SELECT * FROM destination ORDER BY productName; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed, extra test case to validate https://github.com/ClickHouse/ClickHouse/pull/39507#issuecomment-1747574133 + +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp Int64) engine=MergeTree ORDER BY (timestamp) PARTITION BY intDiv(timestamp, 86400000); +CREATE TABLE destination (timestamp 
Int64) engine=MergeTree ORDER BY (timestamp) PARTITION BY toYear(toDateTime(intDiv(timestamp, 1000))); + +INSERT INTO TABLE source VALUES (1267495261123); + +ALTER TABLE destination ATTACH PARTITION ID '14670' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '14670' from source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed, extra test case to validate https://github.com/ClickHouse/ClickHouse/pull/39507#issuecomment-1747511726 + +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp DateTime('UTC'), key Int64, f Float64) engine=MergeTree ORDER BY (key, timestamp) PARTITION BY toYear(timestamp); +CREATE TABLE destination (timestamp DateTime('UTC'), key Int64, f Float64) engine=MergeTree ORDER BY (key, timestamp) PARTITION BY (intDiv(toUInt32(timestamp),86400)); + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01',1,1),('2010-03-02 02:01:01',1,1),('2011-02-02 02:01:03',1,1); + +ALTER TABLE destination ATTACH PARTITION ID '2010' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '2010' from source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed, partitioned table to unpartitioned. Since the destination is unpartitioned, parts would ultimately +-- fall into the same partition. +-- Destination partition by expression is omitted, which causes StorageMetadata::getPartitionKeyAST() to be nullptr. +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple(); + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); + +ALTER TABLE destination ATTACH PARTITION ID '201003' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '201003' from source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Same as above, but destination partition by expression is explicitly defined. Test case required to validate that +-- partition by tuple() is accepted. 
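+-- As with the omitted expression above, the attached part is expected to end up in the single partition
+-- with id 'all', which the partition_id checks below verify for the explicit tuple() case as well.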
+DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY tuple(); + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); + +ALTER TABLE destination ATTACH PARTITION ID '201003' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '201003' from source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed because the destination partition expression columns are a subset of the source partition expression columns +-- Columns in this case refer to the expression elements, not to the actual table columns +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (a Int, b Int, c Int) engine=MergeTree ORDER BY tuple() PARTITION BY (a, b, c); +CREATE TABLE destination (a Int, b Int, c Int) engine=MergeTree ORDER BY tuple() PARTITION BY (a, b); + +INSERT INTO TABLE source VALUES (1, 2, 3), (1, 2, 4); + +ALTER TABLE destination ATTACH PARTITION ID '1-2-3' FROM source; + +SELECT * FROM source ORDER BY (a, b, c); +SELECT * FROM destination ORDER BY (a, b, c); +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION (1, 2, 3) from source; + +SELECT * FROM source ORDER BY (a, b, c); +SELECT * FROM destination ORDER BY (a, b, c); +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed because the destination partition expression columns are a subset of the source partition expression columns +-- Columns in this case refer to the expression elements, not to the actual table columns +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE source (a Int, b Int, c Int) engine=MergeTree ORDER BY tuple() PARTITION BY (a, b, c); +CREATE TABLE destination (a Int, b Int, c Int) engine=MergeTree ORDER BY tuple() PARTITION BY a; + +INSERT INTO TABLE source VALUES (1, 2, 3), (1, 2, 4); + +ALTER TABLE destination ATTACH PARTITION ID '1-2-3' FROM source; + +SELECT * FROM source ORDER BY (a, b, c); +SELECT * FROM destination ORDER BY (a, b, c); +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION (1, 2, 3) from source; + +SELECT * FROM source ORDER BY (a, b, c); +SELECT * FROM destination ORDER BY (a, b, c); +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed. Special test case, tricky to explain. First column of source partition expression is +-- timestamp, while first column of destination partition expression is `A`. One of the previous implementations +-- would not match the columns, which could lead to `timestamp` min max being used to calculate monotonicity of `A`. 
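+-- Illustration with the single row inserted below: the source part belongs to partition (201003, 0),
+-- since toYYYYMM('2010-03-02') = 201003 and intDiv(5, 6) = 0, while the destination partitions by A alone,
+-- so the attached part is expected to land in partition 5. A column mix-up would instead evaluate the
+-- monotonicity of A over the timestamp min/max values.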
+DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (`timestamp` DateTime, `A` Int64) ENGINE = MergeTree PARTITION BY tuple(toYYYYMM(timestamp), intDiv(A, 6)) ORDER BY timestamp; +CREATE TABLE destination (`timestamp` DateTime, `A` Int64) ENGINE = MergeTree PARTITION BY A ORDER BY timestamp; + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01', 5); + +ALTER TABLE destination ATTACH PARTITION ID '201003-0' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION (201003, 0) from source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed. Destination partition expression contains multiple expressions, but all of them are monotonically +-- increasing in the source partition min max indexes. +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (A Int, B Int) ENGINE = MergeTree PARTITION BY tuple(A, B) ORDER BY tuple(); +CREATE TABLE destination (A Int, B Int) ENGINE = MergeTree PARTITION BY tuple(intDiv(A, 2), intDiv(B, 2)) ORDER BY tuple(); + +INSERT INTO TABLE source VALUES (6, 12); + +ALTER TABLE destination ATTACH PARTITION ID '6-12' FROM source; + +SELECT * FROM source ORDER BY A; +SELECT * FROM destination ORDER BY A; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION (6, 12) from source; + +SELECT * FROM source ORDER BY A; +SELECT * FROM destination ORDER BY A; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed. The same scenario as above, but partition expressions inverted. +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (A Int, B Int) ENGINE = MergeTree PARTITION BY tuple(intDiv(A, 2), intDiv(B, 2)) ORDER BY tuple(); +CREATE TABLE destination (A Int, B Int) ENGINE = MergeTree PARTITION BY tuple(A, B) ORDER BY tuple(); + +INSERT INTO TABLE source VALUES (6, 12); + +ALTER TABLE destination ATTACH PARTITION ID '3-6' FROM source; + +SELECT * FROM source ORDER BY A; +SELECT * FROM destination ORDER BY A; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION (3, 6) from source; + +SELECT * FROM source ORDER BY A; +SELECT * FROM destination ORDER BY A; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed, it is a local operation, no different than regular attach. Replicated to replicated. 
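+-- Here the source is partitioned by day (partition id 20100302) and the destination by month, so the
+-- attached part is expected to show up under partition id 201003, mirroring the non-replicated cases above.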
+DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; +CREATE TABLE + source(timestamp DateTime) + ENGINE = ReplicatedMergeTree('/clickhouse/tables/{database}/test/source_replicated_to_replicated_distinct_expression', '1') + PARTITION BY toYYYYMMDD(timestamp) + ORDER BY tuple(); + +CREATE TABLE + destination(timestamp DateTime) + ENGINE = ReplicatedMergeTree('/clickhouse/tables/{database}/test/destination_replicated_to_replicated_distinct_expression', '1') + PARTITION BY toYYYYMM(timestamp) + ORDER BY tuple(); + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); + +ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '20100302' from source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should be allowed, it is a local operation, no different than regular attach. Non replicated to replicated +DROP TABLE IF EXISTS source SYNC; +DROP TABLE IF EXISTS destination SYNC; +CREATE TABLE source(timestamp DateTime) ENGINE = MergeTree() PARTITION BY toYYYYMMDD(timestamp) ORDER BY tuple(); + +CREATE TABLE + destination(timestamp DateTime) + ENGINE = ReplicatedMergeTree('/clickhouse/tables/{database}/test/destination_non_replicated_to_replicated_distinct_expression', '1') + PARTITION BY toYYYYMM(timestamp) + ORDER BY tuple(); + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-02 02:01:03'); + +ALTER TABLE destination ATTACH PARTITION ID '20100302' FROM source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +TRUNCATE TABLE destination; + +ALTER TABLE destination ATTACH PARTITION '20100302' from source; + +SELECT * FROM source ORDER BY timestamp; +SELECT * FROM destination ORDER BY timestamp; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Should not be allowed because data would be split into two different partitions +DROP TABLE IF EXISTS source SYNC; +DROP TABLE IF EXISTS destination SYNC; + +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp); + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01'), ('2010-03-03 02:01:03'); + +ALTER TABLE destination ATTACH PARTITION ID '201003' FROM source; -- { serverError 248 } +ALTER TABLE destination ATTACH PARTITION '201003' from source; -- { serverError 248 } + +-- Should not be allowed because data would be split into two different partitions +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp DateTime, A Int64) engine=MergeTree ORDER BY timestamp PARTITION BY intDiv(A, 6); + +CREATE TABLE destination (timestamp DateTime, A Int64) engine=MergeTree ORDER BY timestamp PARTITION BY A; + +INSERT INTO TABLE source VALUES ('2010-03-02 02:01:01', 1), ('2010-03-02 02:01:03', 2); + +ALTER TABLE destination 
ATTACH PARTITION ID '0' FROM source; -- { serverError 248 } +ALTER TABLE destination ATTACH PARTITION 0 FROM source; -- { serverError 248 } + +-- Should not be allowed because dst partition exp takes more than two arguments, so it's not considered monotonically inc +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY toString(category); +CREATE TABLE destination (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY substring(category, 1, 2); + +INSERT INTO TABLE source VALUES ('spaghetti', 'food'), ('mop', 'general'); +INSERT INTO TABLE source VALUES ('rice', 'food'); + +ALTER TABLE destination ATTACH PARTITION ID '4590ba78048910b74a47d5bfb308abed' from source; -- { serverError 36 } +ALTER TABLE destination ATTACH PARTITION 'food' from source; -- { serverError 36 } + +-- Should not be allowed because dst partition exp depends on a different set of columns +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY toString(category); +CREATE TABLE destination (productName String, category String) engine=MergeTree ORDER BY tuple() PARTITION BY toString(productName); + +INSERT INTO TABLE source VALUES ('spaghetti', 'food'), ('mop', 'general'); +INSERT INTO TABLE source VALUES ('rice', 'food'); + +ALTER TABLE destination ATTACH PARTITION ID '4590ba78048910b74a47d5bfb308abed' from source; -- { serverError 36 } +ALTER TABLE destination ATTACH PARTITION 'food' from source; -- { serverError 36 } + +-- Should not be allowed because dst partition exp is not monotonically increasing +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (productName String) engine=MergeTree ORDER BY tuple() PARTITION BY left(productName, 2); +CREATE TABLE destination (productName String) engine=MergeTree ORDER BY tuple() PARTITION BY cityHash64(productName); + +INSERT INTO TABLE source VALUES ('bread'), ('mop'); +INSERT INTO TABLE source VALUES ('broccoli'); + +ALTER TABLE destination ATTACH PARTITION ID '4589453b7ee96ce9de1265bd57674496' from source; -- { serverError 36 } +ALTER TABLE destination ATTACH PARTITION 'br' from source; -- { serverError 36 } + +-- Empty/ non-existent partition, same partition expression. Nothing should happen +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); + +ALTER TABLE destination ATTACH PARTITION ID '1' FROM source; +ALTER TABLE destination ATTACH PARTITION 1 FROM source; + +SELECT * FROM destination; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Empty/ non-existent partition, different partition expression. 
Nothing should happen +-- https://github.com/ClickHouse/ClickHouse/pull/39507#discussion_r1399839045 +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMMDD(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); + +ALTER TABLE destination ATTACH PARTITION ID '1' FROM source; +ALTER TABLE destination ATTACH PARTITION 1 FROM source; + +SELECT * FROM destination; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Replace instead of attach. Empty/ non-existent partition, same partition expression. Nothing should happen +-- https://github.com/ClickHouse/ClickHouse/pull/39507#discussion_r1399839045 +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); +CREATE TABLE destination (timestamp DateTime) engine=MergeTree ORDER BY tuple() PARTITION BY toYYYYMM(timestamp); + +ALTER TABLE destination REPLACE PARTITION '1' FROM source; + +SELECT * FROM destination; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; + +-- Replace instead of attach. Empty/ non-existent partition to non-empty partition, same partition id. +-- https://github.com/ClickHouse/ClickHouse/pull/39507#discussion_r1399839045 +DROP TABLE IF EXISTS source; +DROP TABLE IF EXISTS destination; + +CREATE TABLE source (A Int) engine=MergeTree ORDER BY tuple() PARTITION BY A; +CREATE TABLE destination (A Int) engine=MergeTree ORDER BY tuple() PARTITION BY A; + +INSERT INTO TABLE destination VALUES (1); + +ALTER TABLE destination REPLACE PARTITION '1' FROM source; + +SELECT * FROM destination; +SELECT partition_id FROM system.parts where table='destination' AND database = currentDatabase() AND active = 1; From 5179891aef9792366d948efd9f1a2454dfe8da69 Mon Sep 17 00:00:00 2001 From: Arthur Passos Date: Tue, 23 Jan 2024 11:43:08 -0300 Subject: [PATCH 0216/1081] remove static log --- src/Storages/MergeTree/MergeTreeDataPartCloner.cpp | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp b/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp index 78cb9aa0624..e384e1b7066 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp @@ -13,8 +13,6 @@ namespace ErrorCodes extern const int BAD_ARGUMENTS; } -static Poco::Logger * log = &Poco::Logger::get("MergeTreeDataPartCloner"); - namespace DistinctPartitionExpression { std::unique_ptr updatePartitionFile( @@ -182,7 +180,7 @@ std::pair cloneSourcePart( } LOG_DEBUG( - log, + &Poco::Logger::get("MergeTreeDataPartCloner"), "Clone {} part {} to {}{}", src_flushed_tmp_part ? 
"flushed" : "", src_part_storage->getFullPath(), From 7e86c0e9280bb6e46183c2c358474bfd283e2554 Mon Sep 17 00:00:00 2001 From: Amos Bird Date: Tue, 23 Jan 2024 23:03:15 +0800 Subject: [PATCH 0217/1081] Compress state of dashboard --- programs/server/dashboard.html | 6 +++--- programs/server/js/lz-string.js | 1 + src/Server/WebUIRequestHandler.cpp | 9 +++++++++ 3 files changed, 13 insertions(+), 3 deletions(-) create mode 100644 programs/server/js/lz-string.js diff --git a/programs/server/dashboard.html b/programs/server/dashboard.html index 04fdfb2d3ca..1f32048da79 100644 --- a/programs/server/dashboard.html +++ b/programs/server/dashboard.html @@ -5,6 +5,7 @@ ClickHouse Dashboard +