From 0d6561ee77041725f12d350e620c1d126563e82e Mon Sep 17 00:00:00 2001 From: Konstantin Bogdanov Date: Mon, 17 Apr 2023 16:52:30 +0200 Subject: [PATCH 001/101] Prototype --- src/Common/ZooKeeper/ZooKeeperCommon.cpp | 1 + src/Common/ZooKeeper/ZooKeeperCommon.h | 9 +++++-- src/Common/ZooKeeper/ZooKeeperConstants.cpp | 3 +++ src/Common/ZooKeeper/ZooKeeperConstants.h | 1 + src/Coordination/KeeperStorage.cpp | 27 ++++++++++++++++++--- 5 files changed, 35 insertions(+), 6 deletions(-) diff --git a/src/Common/ZooKeeper/ZooKeeperCommon.cpp b/src/Common/ZooKeeper/ZooKeeperCommon.cpp index 5031af38812..527b04c8c43 100644 --- a/src/Common/ZooKeeper/ZooKeeperCommon.cpp +++ b/src/Common/ZooKeeper/ZooKeeperCommon.cpp @@ -962,6 +962,7 @@ ZooKeeperRequestFactory::ZooKeeperRequestFactory() registerZooKeeperRequest(*this); registerZooKeeperRequest(*this); registerZooKeeperRequest(*this); + registerZooKeeperRequest(*this); registerZooKeeperRequest(*this); registerZooKeeperRequest(*this); registerZooKeeperRequest(*this); diff --git a/src/Common/ZooKeeper/ZooKeeperCommon.h b/src/Common/ZooKeeper/ZooKeeperCommon.h index 5f00698423e..69f4dd84860 100644 --- a/src/Common/ZooKeeper/ZooKeeperCommon.h +++ b/src/Common/ZooKeeper/ZooKeeperCommon.h @@ -194,7 +194,7 @@ struct ZooKeeperCloseResponse final : ZooKeeperResponse OpNum getOpNum() const override { return OpNum::Close; } }; -struct ZooKeeperCreateRequest final : public CreateRequest, ZooKeeperRequest +struct ZooKeeperCreateRequest : public CreateRequest, ZooKeeperRequest { /// used only during restore from zookeeper log int32_t parent_cversion = -1; @@ -215,7 +215,7 @@ struct ZooKeeperCreateRequest final : public CreateRequest, ZooKeeperRequest void createLogElements(LogElements & elems) const override; }; -struct ZooKeeperCreateResponse final : CreateResponse, ZooKeeperResponse +struct ZooKeeperCreateResponse : CreateResponse, ZooKeeperResponse { void readImpl(ReadBuffer & in) override; @@ -228,6 +228,11 @@ struct ZooKeeperCreateResponse final : CreateResponse, ZooKeeperResponse void fillLogElements(LogElements & elems, size_t idx) const override; }; +struct ZooKeeperCreateIfNotExistsRequest final : public ZooKeeperCreateRequest +{ + OpNum getOpNum() const override { return OpNum::CreateIfNotExists; } +}; + struct ZooKeeperRemoveRequest final : RemoveRequest, ZooKeeperRequest { ZooKeeperRemoveRequest() = default; diff --git a/src/Common/ZooKeeper/ZooKeeperConstants.cpp b/src/Common/ZooKeeper/ZooKeeperConstants.cpp index 86f70ea547a..334afde52f2 100644 --- a/src/Common/ZooKeeper/ZooKeeperConstants.cpp +++ b/src/Common/ZooKeeper/ZooKeeperConstants.cpp @@ -21,6 +21,7 @@ static const std::unordered_set VALID_OPERATIONS = static_cast(OpNum::Check), static_cast(OpNum::Multi), static_cast(OpNum::MultiRead), + static_cast(OpNum::CreateIfNotExists), static_cast(OpNum::Auth), static_cast(OpNum::SessionID), static_cast(OpNum::SetACL), @@ -57,6 +58,8 @@ std::string toString(OpNum op_num) return "Multi"; case OpNum::MultiRead: return "MultiRead"; + case OpNum::CreateIfNotExists: + return "CreateIfNotExists"; case OpNum::Sync: return "Sync"; case OpNum::Heartbeat: diff --git a/src/Common/ZooKeeper/ZooKeeperConstants.h b/src/Common/ZooKeeper/ZooKeeperConstants.h index 6b50c5c5d09..6582e58e92c 100644 --- a/src/Common/ZooKeeper/ZooKeeperConstants.h +++ b/src/Common/ZooKeeper/ZooKeeperConstants.h @@ -37,6 +37,7 @@ enum class OpNum : int32_t // CH Keeper specific operations FilteredList = 500, CheckNotExists = 501, + CreateIfNotExists = 502, SessionID = 997, /// Special internal 
request }; diff --git a/src/Coordination/KeeperStorage.cpp b/src/Coordination/KeeperStorage.cpp index 7a1a5e42632..e0c69933337 100644 --- a/src/Coordination/KeeperStorage.cpp +++ b/src/Coordination/KeeperStorage.cpp @@ -1001,11 +1001,25 @@ struct KeeperStorageCreateRequestProcessor final : public KeeperStorageRequestPr Coordination::ZooKeeperResponsePtr process(KeeperStorage & storage, int64_t zxid) const override { Coordination::ZooKeeperResponsePtr response_ptr = zk_request->makeResponse(); - Coordination::ZooKeeperCreateResponse & response = dynamic_cast(*response_ptr); + Coordination::ZooKeeperCreateResponse * response = dynamic_cast(response_ptr.get()); + + Coordination::ZooKeeperCreateIfNotExistsRequest * create_if_not_exists_request = dynamic_cast(zk_request.get()); + + if (create_if_not_exists_request != nullptr) { + Coordination::ZooKeeperCreateIfNotExistsRequest & request = dynamic_cast(*zk_request); + + auto & container = storage.container; + auto node_it = container.find(request.path); + if (node_it != container.end()) + { + response->error = Coordination::Error::ZOK; + return response_ptr; + } + } if (const auto result = storage.commit(zxid); result != Coordination::Error::ZOK) { - response.error = result; + response->error = result; return response_ptr; } @@ -1016,8 +1030,8 @@ struct KeeperStorageCreateRequestProcessor final : public KeeperStorageRequestPr [zxid](const auto & delta) { return delta.zxid == zxid && std::holds_alternative(delta.operation); }); - response.path_created = create_delta_it->path; - response.error = Coordination::Error::ZOK; + response->path_created = create_delta_it->path; + response->error = Coordination::Error::ZOK; return response_ptr; } }; @@ -1730,6 +1744,10 @@ struct KeeperStorageMultiRequestProcessor final : public KeeperStorageRequestPro check_operation_type(OperationType::Write); concrete_requests.push_back(std::make_shared(sub_zk_request)); break; + case Coordination::OpNum::CreateIfNotExists: + check_operation_type(OperationType::Write); + concrete_requests.push_back(std::make_shared(sub_zk_request)); + break; case Coordination::OpNum::Remove: check_operation_type(OperationType::Write); concrete_requests.push_back(std::make_shared(sub_zk_request)); @@ -1993,6 +2011,7 @@ KeeperStorageRequestProcessorsFactory::KeeperStorageRequestProcessorsFactory() registerKeeperRequestProcessor(*this); registerKeeperRequestProcessor(*this); registerKeeperRequestProcessor(*this); + registerKeeperRequestProcessor(*this); registerKeeperRequestProcessor(*this); registerKeeperRequestProcessor(*this); registerKeeperRequestProcessor(*this); From b53f36369e9a148634d6b4c1fa9526b3bcd3c67c Mon Sep 17 00:00:00 2001 From: Konstantin Bogdanov Date: Mon, 17 Apr 2023 17:47:57 +0200 Subject: [PATCH 002/101] Remove new request object --- src/Common/ZooKeeper/ZooKeeperCommon.cpp | 2 +- src/Common/ZooKeeper/ZooKeeperCommon.h | 9 ++------- src/Coordination/KeeperStorage.cpp | 16 +++++++--------- 3 files changed, 10 insertions(+), 17 deletions(-) diff --git a/src/Common/ZooKeeper/ZooKeeperCommon.cpp b/src/Common/ZooKeeper/ZooKeeperCommon.cpp index 527b04c8c43..c148b68b95e 100644 --- a/src/Common/ZooKeeper/ZooKeeperCommon.cpp +++ b/src/Common/ZooKeeper/ZooKeeperCommon.cpp @@ -962,7 +962,7 @@ ZooKeeperRequestFactory::ZooKeeperRequestFactory() registerZooKeeperRequest(*this); registerZooKeeperRequest(*this); registerZooKeeperRequest(*this); - registerZooKeeperRequest(*this); + registerZooKeeperRequest(*this); registerZooKeeperRequest(*this); registerZooKeeperRequest(*this); 
registerZooKeeperRequest(*this); diff --git a/src/Common/ZooKeeper/ZooKeeperCommon.h b/src/Common/ZooKeeper/ZooKeeperCommon.h index 69f4dd84860..5f00698423e 100644 --- a/src/Common/ZooKeeper/ZooKeeperCommon.h +++ b/src/Common/ZooKeeper/ZooKeeperCommon.h @@ -194,7 +194,7 @@ struct ZooKeeperCloseResponse final : ZooKeeperResponse OpNum getOpNum() const override { return OpNum::Close; } }; -struct ZooKeeperCreateRequest : public CreateRequest, ZooKeeperRequest +struct ZooKeeperCreateRequest final : public CreateRequest, ZooKeeperRequest { /// used only during restore from zookeeper log int32_t parent_cversion = -1; @@ -215,7 +215,7 @@ struct ZooKeeperCreateRequest : public CreateRequest, ZooKeeperRequest void createLogElements(LogElements & elems) const override; }; -struct ZooKeeperCreateResponse : CreateResponse, ZooKeeperResponse +struct ZooKeeperCreateResponse final : CreateResponse, ZooKeeperResponse { void readImpl(ReadBuffer & in) override; @@ -228,11 +228,6 @@ struct ZooKeeperCreateResponse : CreateResponse, ZooKeeperResponse void fillLogElements(LogElements & elems, size_t idx) const override; }; -struct ZooKeeperCreateIfNotExistsRequest final : public ZooKeeperCreateRequest -{ - OpNum getOpNum() const override { return OpNum::CreateIfNotExists; } -}; - struct ZooKeeperRemoveRequest final : RemoveRequest, ZooKeeperRequest { ZooKeeperRemoveRequest() = default; diff --git a/src/Coordination/KeeperStorage.cpp b/src/Coordination/KeeperStorage.cpp index e0c69933337..825fcca42f5 100644 --- a/src/Coordination/KeeperStorage.cpp +++ b/src/Coordination/KeeperStorage.cpp @@ -1001,25 +1001,23 @@ struct KeeperStorageCreateRequestProcessor final : public KeeperStorageRequestPr Coordination::ZooKeeperResponsePtr process(KeeperStorage & storage, int64_t zxid) const override { Coordination::ZooKeeperResponsePtr response_ptr = zk_request->makeResponse(); - Coordination::ZooKeeperCreateResponse * response = dynamic_cast(response_ptr.get()); + Coordination::ZooKeeperCreateResponse & response = dynamic_cast(*response_ptr); - Coordination::ZooKeeperCreateIfNotExistsRequest * create_if_not_exists_request = dynamic_cast(zk_request.get()); - - if (create_if_not_exists_request != nullptr) { - Coordination::ZooKeeperCreateIfNotExistsRequest & request = dynamic_cast(*zk_request); + if (zk_request->getOpNum() == Coordination::OpNum::CreateIfNotExists) { + Coordination::ZooKeeperCreateRequest & request = dynamic_cast(*zk_request); auto & container = storage.container; auto node_it = container.find(request.path); if (node_it != container.end()) { - response->error = Coordination::Error::ZOK; + response.error = Coordination::Error::ZOK; return response_ptr; } } if (const auto result = storage.commit(zxid); result != Coordination::Error::ZOK) { - response->error = result; + response.error = result; return response_ptr; } @@ -1030,8 +1028,8 @@ struct KeeperStorageCreateRequestProcessor final : public KeeperStorageRequestPr [zxid](const auto & delta) { return delta.zxid == zxid && std::holds_alternative(delta.operation); }); - response->path_created = create_delta_it->path; - response->error = Coordination::Error::ZOK; + response.path_created = create_delta_it->path; + response.error = Coordination::Error::ZOK; return response_ptr; } }; From f84fdb7f1079c688278d1378d677ecdc60bd942b Mon Sep 17 00:00:00 2001 From: Konstantin Bogdanov Date: Mon, 17 Apr 2023 17:48:22 +0200 Subject: [PATCH 003/101] Increment Keeper API version --- src/Coordination/KeeperConstants.h | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) 
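For context: CreateIfNotExists, as introduced by the two patches above, is an ordinary Create that reports ZOK instead of ZNODEEXISTS when the node already exists, and it is also accepted inside a Multi request. A rough client-side sketch of the pattern this replaces — illustrative only, not part of the patch series; it assumes an existing zkutil::ZooKeeper session `zookeeper` and a node `path` with payload `data`:

    // Without the new op the caller has to tolerate ZNODEEXISTS itself,
    // which does not compose well with multi-requests.
    auto code = zookeeper->tryCreate(path, data, zkutil::CreateMode::Persistent);
    if (code == Coordination::Error::ZNODEEXISTS)
        code = Coordination::Error::ZOK; // CreateIfNotExists makes the server return ZOK here by itself

The patch below bumps the Keeper API version so that clients can detect whether the server understands the new op.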
diff --git a/src/Coordination/KeeperConstants.h b/src/Coordination/KeeperConstants.h
index 4b5a5b54be0..afe3fcfb4c9 100644
--- a/src/Coordination/KeeperConstants.h
+++ b/src/Coordination/KeeperConstants.h
@@ -11,9 +11,10 @@ enum class KeeperApiVersion : uint8_t
     WITH_FILTERED_LIST,
     WITH_MULTI_READ,
     WITH_CHECK_NOT_EXISTS,
+    WITH_CREATE_IF_NOT_EXISTS
 };
 
-inline constexpr auto current_keeper_api_version = KeeperApiVersion::WITH_CHECK_NOT_EXISTS;
+inline constexpr auto current_keeper_api_version = KeeperApiVersion::WITH_CREATE_IF_NOT_EXISTS;
 
 const std::string keeper_system_path = "/keeper";
 const std::string keeper_api_version_path = keeper_system_path + "/api_version";

From 965f7850f8b7d5150bfedaffc11f9a5d4c2fe6fd Mon Sep 17 00:00:00 2001
From: Konstantin Bogdanov
Date: Thu, 20 Apr 2023 13:26:52 +0200
Subject: [PATCH 004/101] Cleanup

---
 src/Common/ZooKeeper/ZooKeeperCommon.cpp |  2 ++
 src/Common/ZooKeeper/ZooKeeperCommon.h   |  5 ++++-
 src/Coordination/KeeperStorage.cpp       | 21 +++++++++++----------
 3 files changed, 17 insertions(+), 11 deletions(-)

diff --git a/src/Common/ZooKeeper/ZooKeeperCommon.cpp b/src/Common/ZooKeeper/ZooKeeperCommon.cpp
index c148b68b95e..89999f7d56b 100644
--- a/src/Common/ZooKeeper/ZooKeeperCommon.cpp
+++ b/src/Common/ZooKeeper/ZooKeeperCommon.cpp
@@ -941,6 +941,8 @@ void registerZooKeeperRequest(ZooKeeperRequestFactory & factory)
             res->operation_type = ZooKeeperMultiRequest::OperationType::Write;
         else if constexpr (num == OpNum::CheckNotExists)
             res->not_exists = true;
+        else if constexpr (num == OpNum::CreateIfNotExists)
+            res->not_exists = true;
 
         return res;
     });
diff --git a/src/Common/ZooKeeper/ZooKeeperCommon.h b/src/Common/ZooKeeper/ZooKeeperCommon.h
index 5f00698423e..ee4eab1156c 100644
--- a/src/Common/ZooKeeper/ZooKeeperCommon.h
+++ b/src/Common/ZooKeeper/ZooKeeperCommon.h
@@ -199,10 +199,13 @@ struct ZooKeeperCreateRequest final : public CreateRequest, ZooKeeperRequest
     /// used only during restore from zookeeper log
     int32_t parent_cversion = -1;
 
+    /// should it fail if node already exists
+    bool not_exists = false;
+
     ZooKeeperCreateRequest() = default;
     explicit ZooKeeperCreateRequest(const CreateRequest & base) : CreateRequest(base) {}
 
-    OpNum getOpNum() const override { return OpNum::Create; }
+    OpNum getOpNum() const override { return not_exists ?
OpNum::CreateIfNotExists : OpNum::Create; } void writeImpl(WriteBuffer & out) const override; void readImpl(ReadBuffer & in) override; std::string toStringImpl() const override; diff --git a/src/Coordination/KeeperStorage.cpp b/src/Coordination/KeeperStorage.cpp index 825fcca42f5..8bfe1e667b4 100644 --- a/src/Coordination/KeeperStorage.cpp +++ b/src/Coordination/KeeperStorage.cpp @@ -917,6 +917,15 @@ struct KeeperStorageCreateRequestProcessor final : public KeeperStorageRequestPr std::vector new_deltas; + if (zk_request->getOpNum() == Coordination::OpNum::CreateIfNotExists) { + auto & container = storage.container; + auto node_it = container.find(request.path); + if (node_it != container.end()) + { + return new_deltas; + } + } + auto parent_path = parentPath(request.path); auto parent_node = storage.uncommitted_state.getNode(parent_path); if (parent_node == nullptr) @@ -1003,16 +1012,8 @@ struct KeeperStorageCreateRequestProcessor final : public KeeperStorageRequestPr Coordination::ZooKeeperResponsePtr response_ptr = zk_request->makeResponse(); Coordination::ZooKeeperCreateResponse & response = dynamic_cast(*response_ptr); - if (zk_request->getOpNum() == Coordination::OpNum::CreateIfNotExists) { - Coordination::ZooKeeperCreateRequest & request = dynamic_cast(*zk_request); - - auto & container = storage.container; - auto node_it = container.find(request.path); - if (node_it != container.end()) - { - response.error = Coordination::Error::ZOK; - return response_ptr; - } + if (storage.uncommitted_state.deltas.begin()->zxid != zxid) { + return response_ptr; } if (const auto result = storage.commit(zxid); result != Coordination::Error::ZOK) From 7e151428acb257dbaab24940351159c9b50b6a9c Mon Sep 17 00:00:00 2001 From: Konstantin Bogdanov Date: Fri, 21 Apr 2023 15:10:38 +0200 Subject: [PATCH 005/101] Lint --- src/Common/ZooKeeper/ZooKeeperCommon.cpp | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/src/Common/ZooKeeper/ZooKeeperCommon.cpp b/src/Common/ZooKeeper/ZooKeeperCommon.cpp index 89999f7d56b..61b9d6e5172 100644 --- a/src/Common/ZooKeeper/ZooKeeperCommon.cpp +++ b/src/Common/ZooKeeper/ZooKeeperCommon.cpp @@ -1,4 +1,5 @@ #include "Common/ZooKeeper/IKeeper.h" +#include "Common/ZooKeeper/ZooKeeperConstants.h" #include #include #include @@ -939,9 +940,7 @@ void registerZooKeeperRequest(ZooKeeperRequestFactory & factory) res->operation_type = ZooKeeperMultiRequest::OperationType::Read; else if constexpr (num == OpNum::Multi) res->operation_type = ZooKeeperMultiRequest::OperationType::Write; - else if constexpr (num == OpNum::CheckNotExists) - res->not_exists = true; - else if constexpr (num == OpNum::CreateIfNotExists) + else if constexpr (num == OpNum::CheckNotExists || num == OpNum::CreateIfNotExists) res->not_exists = true; return res; From 203276dfcc40b9d4f2b19a1eb0af430e612e8949 Mon Sep 17 00:00:00 2001 From: Konstantin Bogdanov Date: Fri, 21 Apr 2023 15:18:39 +0200 Subject: [PATCH 006/101] Use `storage.uncommited_state` --- src/Coordination/KeeperStorage.cpp | 12 +++++++----- 1 file changed, 7 insertions(+), 5 deletions(-) diff --git a/src/Coordination/KeeperStorage.cpp b/src/Coordination/KeeperStorage.cpp index 8bfe1e667b4..308f6dcf815 100644 --- a/src/Coordination/KeeperStorage.cpp +++ b/src/Coordination/KeeperStorage.cpp @@ -918,12 +918,14 @@ struct KeeperStorageCreateRequestProcessor final : public KeeperStorageRequestPr std::vector new_deltas; if (zk_request->getOpNum() == Coordination::OpNum::CreateIfNotExists) { - auto & container = storage.container; - auto 
node_it = container.find(request.path); - if (node_it != container.end()) - { + // auto & container = storage.container; + // auto node_it = container.find(request.path); + // if (node_it != container.end()) + // { + // return new_deltas; + // } + if (storage.uncommitted_state.getNode(request.path) != nullptr) return new_deltas; - } } auto parent_path = parentPath(request.path); From 2b94418dc3e3a891212a7a677e11930b987e2f34 Mon Sep 17 00:00:00 2001 From: Konstantin Bogdanov Date: Fri, 21 Apr 2023 15:19:08 +0200 Subject: [PATCH 007/101] Add new OpNum to ZooKeeperLogElement --- src/Interpreters/ZooKeeperLog.cpp | 1 + 1 file changed, 1 insertion(+) diff --git a/src/Interpreters/ZooKeeperLog.cpp b/src/Interpreters/ZooKeeperLog.cpp index 48f4d510af7..880b9d3686d 100644 --- a/src/Interpreters/ZooKeeperLog.cpp +++ b/src/Interpreters/ZooKeeperLog.cpp @@ -88,6 +88,7 @@ NamesAndTypesList ZooKeeperLogElement::getNamesAndTypes() {"SessionID", static_cast(Coordination::OpNum::SessionID)}, {"FilteredList", static_cast(Coordination::OpNum::FilteredList)}, {"CheckNotExists", static_cast(Coordination::OpNum::CheckNotExists)}, + {"CreateIfNotExists", static_cast(Coordination::OpNum::CreateIfNotExists)}, }); auto error_enum = getCoordinationErrorCodesEnumType(); From bd2718c79dc0dbbd84b81f8086082f8164f887e7 Mon Sep 17 00:00:00 2001 From: Konstantin Bogdanov Date: Mon, 8 May 2023 17:55:49 +0200 Subject: [PATCH 008/101] Fix comment --- src/Common/ZooKeeper/ZooKeeperCommon.h | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Common/ZooKeeper/ZooKeeperCommon.h b/src/Common/ZooKeeper/ZooKeeperCommon.h index ee4eab1156c..264b2bb9606 100644 --- a/src/Common/ZooKeeper/ZooKeeperCommon.h +++ b/src/Common/ZooKeeper/ZooKeeperCommon.h @@ -199,7 +199,7 @@ struct ZooKeeperCreateRequest final : public CreateRequest, ZooKeeperRequest /// used only during restore from zookeeper log int32_t parent_cversion = -1; - /// should it fail if node already exists + /// should it succeed if node already exists bool not_exists = false; ZooKeeperCreateRequest() = default; From 3a3539b9965012752f955e956e12624b54083bd2 Mon Sep 17 00:00:00 2001 From: Konstantin Bogdanov Date: Mon, 8 May 2023 18:22:35 +0200 Subject: [PATCH 009/101] Style fix --- src/Coordination/KeeperStorage.cpp | 15 +++------------ 1 file changed, 3 insertions(+), 12 deletions(-) diff --git a/src/Coordination/KeeperStorage.cpp b/src/Coordination/KeeperStorage.cpp index 308f6dcf815..f368c11a2c6 100644 --- a/src/Coordination/KeeperStorage.cpp +++ b/src/Coordination/KeeperStorage.cpp @@ -917,16 +917,8 @@ struct KeeperStorageCreateRequestProcessor final : public KeeperStorageRequestPr std::vector new_deltas; - if (zk_request->getOpNum() == Coordination::OpNum::CreateIfNotExists) { - // auto & container = storage.container; - // auto node_it = container.find(request.path); - // if (node_it != container.end()) - // { - // return new_deltas; - // } - if (storage.uncommitted_state.getNode(request.path) != nullptr) - return new_deltas; - } + if (zk_request->getOpNum() == Coordination::OpNum::CreateIfNotExists && storage.uncommitted_state.getNode(request.path) != nullptr) + return new_deltas; auto parent_path = parentPath(request.path); auto parent_node = storage.uncommitted_state.getNode(parent_path); @@ -1014,9 +1006,8 @@ struct KeeperStorageCreateRequestProcessor final : public KeeperStorageRequestPr Coordination::ZooKeeperResponsePtr response_ptr = zk_request->makeResponse(); Coordination::ZooKeeperCreateResponse & response = dynamic_cast(*response_ptr); - if 
(storage.uncommitted_state.deltas.begin()->zxid != zxid) { + if (storage.uncommitted_state.deltas.begin()->zxid != zxid) return response_ptr; - } if (const auto result = storage.commit(zxid); result != Coordination::Error::ZOK) { From b61ffe3ff7873fe17a33d8ce90a795bd1d6879b6 Mon Sep 17 00:00:00 2001 From: Konstantin Bogdanov Date: Tue, 9 May 2023 18:11:55 +0200 Subject: [PATCH 010/101] Merge checks --- src/Coordination/KeeperStorage.cpp | 8 +++++--- 1 file changed, 5 insertions(+), 3 deletions(-) diff --git a/src/Coordination/KeeperStorage.cpp b/src/Coordination/KeeperStorage.cpp index f368c11a2c6..53df5451e67 100644 --- a/src/Coordination/KeeperStorage.cpp +++ b/src/Coordination/KeeperStorage.cpp @@ -917,9 +917,6 @@ struct KeeperStorageCreateRequestProcessor final : public KeeperStorageRequestPr std::vector new_deltas; - if (zk_request->getOpNum() == Coordination::OpNum::CreateIfNotExists && storage.uncommitted_state.getNode(request.path) != nullptr) - return new_deltas; - auto parent_path = parentPath(request.path); auto parent_node = storage.uncommitted_state.getNode(parent_path); if (parent_node == nullptr) @@ -949,7 +946,12 @@ struct KeeperStorageCreateRequestProcessor final : public KeeperStorageRequestPr } if (storage.uncommitted_state.getNode(path_created)) + { + if (zk_request->getOpNum() == Coordination::OpNum::CreateIfNotExists) + return new_deltas; + return {KeeperStorage::Delta{zxid, Coordination::Error::ZNODEEXISTS}}; + } if (getBaseName(path_created).size == 0) return {KeeperStorage::Delta{zxid, Coordination::Error::ZBADARGUMENTS}}; From b2324d723e02616d472f4b0c7622c99f4acd6296 Mon Sep 17 00:00:00 2001 From: Konstantin Bogdanov Date: Tue, 30 May 2023 21:09:37 +0200 Subject: [PATCH 011/101] Use native `createIfNotExists` for `createAncestors` if available --- src/Common/ZooKeeper/IKeeper.h | 3 +++ src/Common/ZooKeeper/Types.h | 2 +- src/Common/ZooKeeper/ZooKeeper.cpp | 30 +++++++++++++++++++++++- src/Common/ZooKeeper/ZooKeeperCommon.cpp | 8 ++++++- src/Common/ZooKeeper/ZooKeeperCommon.h | 11 +++++---- 5 files changed, 47 insertions(+), 7 deletions(-) diff --git a/src/Common/ZooKeeper/IKeeper.h b/src/Common/ZooKeeper/IKeeper.h index 3eb5819df90..efc05fd7db1 100644 --- a/src/Common/ZooKeeper/IKeeper.h +++ b/src/Common/ZooKeeper/IKeeper.h @@ -199,6 +199,9 @@ struct CreateRequest : virtual Request bool is_sequential = false; ACLs acls; + /// should it succeed if node already exists + bool not_exists = false; + void addRootPath(const String & root_path) override; String getPath() const override { return path; } diff --git a/src/Common/ZooKeeper/Types.h b/src/Common/ZooKeeper/Types.h index 0309f56ad5b..d2876adaabc 100644 --- a/src/Common/ZooKeeper/Types.h +++ b/src/Common/ZooKeeper/Types.h @@ -29,7 +29,7 @@ using EventPtr = std::shared_ptr; template using AsyncResponses = std::vector>>; -Coordination::RequestPtr makeCreateRequest(const std::string & path, const std::string & data, int create_mode); +Coordination::RequestPtr makeCreateRequest(const std::string & path, const std::string & data, int create_mode, bool ignore_if_exists = false); Coordination::RequestPtr makeRemoveRequest(const std::string & path, int version); Coordination::RequestPtr makeSetRequest(const std::string & path, const std::string & data, int version); Coordination::RequestPtr makeCheckRequest(const std::string & path, int version); diff --git a/src/Common/ZooKeeper/ZooKeeper.cpp b/src/Common/ZooKeeper/ZooKeeper.cpp index a587ad6caf4..3357c75f50a 100644 --- a/src/Common/ZooKeeper/ZooKeeper.cpp +++ 
b/src/Common/ZooKeeper/ZooKeeper.cpp @@ -1,4 +1,5 @@ #include "ZooKeeper.h" +#include "Coordination/KeeperConstants.h" #include "ZooKeeperImpl.h" #include "KeeperException.h" #include "TestKeeper.h" @@ -351,6 +352,32 @@ void ZooKeeper::createIfNotExists(const std::string & path, const std::string & void ZooKeeper::createAncestors(const std::string & path) { size_t pos = 1; + + if (getApiVersion() >= DB::KeeperApiVersion::WITH_CREATE_IF_NOT_EXISTS) + { + Coordination::Requests create_ops; + + while (true) + { + pos = path.find('/', pos); + if (pos == std::string::npos) + break; + + auto request = makeCreateRequest(path.substr(0, pos), "", CreateMode::Persistent, true); + create_ops.emplace_back(request); + + ++pos; + } + + Coordination::Responses responses; + Coordination::Error code = multiImpl(create_ops, responses); + + if (code == Coordination::Error::ZOK) + return; + + throw KeeperException(code, path); + } + while (true) { pos = path.find('/', pos); @@ -1261,13 +1288,14 @@ void KeeperMultiException::check( } -Coordination::RequestPtr makeCreateRequest(const std::string & path, const std::string & data, int create_mode) +Coordination::RequestPtr makeCreateRequest(const std::string & path, const std::string & data, int create_mode, bool ignore_if_exists) { auto request = std::make_shared(); request->path = path; request->data = data; request->is_ephemeral = create_mode == CreateMode::Ephemeral || create_mode == CreateMode::EphemeralSequential; request->is_sequential = create_mode == CreateMode::PersistentSequential || create_mode == CreateMode::EphemeralSequential; + request->not_exists = ignore_if_exists; return request; } diff --git a/src/Common/ZooKeeper/ZooKeeperCommon.cpp b/src/Common/ZooKeeper/ZooKeeperCommon.cpp index 61b9d6e5172..5a34f7cc8d5 100644 --- a/src/Common/ZooKeeper/ZooKeeperCommon.cpp +++ b/src/Common/ZooKeeper/ZooKeeperCommon.cpp @@ -660,7 +660,6 @@ void ZooKeeperMultiResponse::writeImpl(WriteBuffer & out) const ZooKeeperResponsePtr ZooKeeperHeartbeatRequest::makeResponse() const { return setTime(std::make_shared()); } ZooKeeperResponsePtr ZooKeeperSyncRequest::makeResponse() const { return setTime(std::make_shared()); } ZooKeeperResponsePtr ZooKeeperAuthRequest::makeResponse() const { return setTime(std::make_shared()); } -ZooKeeperResponsePtr ZooKeeperCreateRequest::makeResponse() const { return setTime(std::make_shared()); } ZooKeeperResponsePtr ZooKeeperRemoveRequest::makeResponse() const { return setTime(std::make_shared()); } ZooKeeperResponsePtr ZooKeeperExistsRequest::makeResponse() const { return setTime(std::make_shared()); } ZooKeeperResponsePtr ZooKeeperGetRequest::makeResponse() const { return setTime(std::make_shared()); } @@ -668,6 +667,13 @@ ZooKeeperResponsePtr ZooKeeperSetRequest::makeResponse() const { return setTime( ZooKeeperResponsePtr ZooKeeperListRequest::makeResponse() const { return setTime(std::make_shared()); } ZooKeeperResponsePtr ZooKeeperSimpleListRequest::makeResponse() const { return setTime(std::make_shared()); } +ZooKeeperResponsePtr ZooKeeperCreateRequest::makeResponse() const +{ + if (not_exists) + return setTime(std::make_shared()); + return setTime(std::make_shared()); +} + ZooKeeperResponsePtr ZooKeeperCheckRequest::makeResponse() const { if (not_exists) diff --git a/src/Common/ZooKeeper/ZooKeeperCommon.h b/src/Common/ZooKeeper/ZooKeeperCommon.h index 264b2bb9606..b79cbc204a0 100644 --- a/src/Common/ZooKeeper/ZooKeeperCommon.h +++ b/src/Common/ZooKeeper/ZooKeeperCommon.h @@ -199,9 +199,6 @@ struct ZooKeeperCreateRequest final : 
public CreateRequest, ZooKeeperRequest /// used only during restore from zookeeper log int32_t parent_cversion = -1; - /// should it succeed if node already exists - bool not_exists = false; - ZooKeeperCreateRequest() = default; explicit ZooKeeperCreateRequest(const CreateRequest & base) : CreateRequest(base) {} @@ -218,7 +215,7 @@ struct ZooKeeperCreateRequest final : public CreateRequest, ZooKeeperRequest void createLogElements(LogElements & elems) const override; }; -struct ZooKeeperCreateResponse final : CreateResponse, ZooKeeperResponse +struct ZooKeeperCreateResponse : CreateResponse, ZooKeeperResponse { void readImpl(ReadBuffer & in) override; @@ -231,6 +228,12 @@ struct ZooKeeperCreateResponse final : CreateResponse, ZooKeeperResponse void fillLogElements(LogElements & elems, size_t idx) const override; }; +struct ZooKeeperCreateIfNotExistsResponse : ZooKeeperCreateResponse +{ + OpNum getOpNum() const override { return OpNum::CreateIfNotExists; } + using ZooKeeperCreateResponse::ZooKeeperCreateResponse; +}; + struct ZooKeeperRemoveRequest final : RemoveRequest, ZooKeeperRequest { ZooKeeperRemoveRequest() = default; From 6e8ccafbb22813f7c736c3fd2f5363124985da3e Mon Sep 17 00:00:00 2001 From: Antonio Andelic Date: Mon, 5 Jun 2023 09:40:29 +0200 Subject: [PATCH 012/101] Fix test --- .../0_stateless/02735_system_zookeeper_connection.reference | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02735_system_zookeeper_connection.reference b/tests/queries/0_stateless/02735_system_zookeeper_connection.reference index 1deabd88b88..2176580086b 100644 --- a/tests/queries/0_stateless/02735_system_zookeeper_connection.reference +++ b/tests/queries/0_stateless/02735_system_zookeeper_connection.reference @@ -1,2 +1,2 @@ -default ::1 9181 0 0 3 +default ::1 9181 0 0 4 zookeeper2 ::1 9181 0 0 0 From eb0e14b870108acf131456abee6acfab389bfa42 Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Tue, 6 Jun 2023 00:44:20 +0000 Subject: [PATCH 013/101] allow to replace long file names to hashes --- src/Common/SipHash.h | 11 ++++ src/DataTypes/Serializations/ISerialization.h | 1 + .../MergeTree/MergeTreeDataPartChecksum.cpp | 13 ++++ .../MergeTree/MergeTreeDataPartChecksum.h | 2 + .../MergeTree/MergeTreeDataPartWriterWide.cpp | 40 +++++++----- .../MergeTree/MergeTreeDataPartWriterWide.h | 4 ++ .../MergeTree/MergeTreeReaderWide.cpp | 61 +++++++++++-------- src/Storages/MergeTree/MergeTreeSettings.h | 2 + 8 files changed, 93 insertions(+), 41 deletions(-) diff --git a/src/Common/SipHash.h b/src/Common/SipHash.h index 9e6479d81c1..e1cd5cc0aa3 100644 --- a/src/Common/SipHash.h +++ b/src/Common/SipHash.h @@ -20,6 +20,7 @@ #include #include #include +#include #include @@ -284,6 +285,16 @@ inline UInt128 sipHash128(const char * data, const size_t size) return sipHash128Keyed(0, 0, data, size); } +inline String sipHash128String(const char * data, const size_t size) +{ + return getHexUIntLowercase(sipHash128(data, size)); +} + +inline String sipHash128String(const String & str) +{ + return sipHash128String(str.data(), str.size()); +} + inline UInt128 sipHash128ReferenceKeyed(UInt64 key0, UInt64 key1, const char * data, const size_t size) { SipHash hash(key0, key1, true); diff --git a/src/DataTypes/Serializations/ISerialization.h b/src/DataTypes/Serializations/ISerialization.h index 17e6dfb85bc..ed090cefa38 100644 --- a/src/DataTypes/Serializations/ISerialization.h +++ b/src/DataTypes/Serializations/ISerialization.h @@ -368,6 +368,7 @@ public: static String 
getFileNameForStream(const NameAndTypePair & column, const SubstreamPath & path); static String getFileNameForStream(const String & name_in_storage, const SubstreamPath & path); + static String getSubcolumnNameForStream(const SubstreamPath & path); static String getSubcolumnNameForStream(const SubstreamPath & path, size_t prefix_len); diff --git a/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp b/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp index 78f68ea72fe..2f97edd1a9c 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp @@ -8,6 +8,7 @@ #include #include #include +#include namespace DB @@ -340,6 +341,18 @@ MergeTreeDataPartChecksums::Checksum::uint128 MergeTreeDataPartChecksums::getTot return ret; } +std::optional MergeTreeDataPartChecksums::getFileNameOrHash(const String & name) const +{ + if (files.contains(name + ".bin")) + return name; + + auto hash = sipHash128String(name); + if (files.contains(hash + ".bin")) + return hash; + + return std::nullopt; +} + void MinimalisticDataPartChecksums::serialize(WriteBuffer & to) const { writeString("checksums format version: 5\n", to); diff --git a/src/Storages/MergeTree/MergeTreeDataPartChecksum.h b/src/Storages/MergeTree/MergeTreeDataPartChecksum.h index db110043b74..626b0a90839 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartChecksum.h +++ b/src/Storages/MergeTree/MergeTreeDataPartChecksum.h @@ -88,6 +88,8 @@ struct MergeTreeDataPartChecksums static MergeTreeDataPartChecksums deserializeFrom(const String & s); UInt64 getTotalSizeOnDisk() const; + + std::optional getFileNameOrHash(const String & name) const; }; diff --git a/src/Storages/MergeTree/MergeTreeDataPartWriterWide.cpp b/src/Storages/MergeTree/MergeTreeDataPartWriterWide.cpp index f9fe6f2c8ab..60bb1119770 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWriterWide.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartWriterWide.cpp @@ -97,7 +97,15 @@ void MergeTreeDataPartWriterWide::addStreams( ISerialization::StreamCallback callback = [&](const auto & substream_path) { assert(!substream_path.empty()); - String stream_name = ISerialization::getFileNameForStream(column, substream_path); + + auto storage_settings = storage.getSettings(); + auto full_stream_name = ISerialization::getFileNameForStream(column, substream_path); + + String stream_name; + if (storage_settings->replace_long_file_name_to_hash && full_stream_name.size() > storage_settings->max_file_name_length) + stream_name = sipHash128String(full_stream_name); + else + stream_name = full_stream_name; /// Shared offsets for Nested type. 
if (column_streams.contains(stream_name)) @@ -126,12 +134,21 @@ void MergeTreeDataPartWriterWide::addStreams( marks_compression_codec, settings.marks_compress_block_size, settings.query_write_settings); + + full_name_to_stream_name.emplace(full_stream_name, stream_name); }; ISerialization::SubstreamPath path; data_part->getSerialization(column.name)->enumerateStreams(callback, column.type); } +const String & MergeTreeDataPartWriterWide::getStreamName( + const NameAndTypePair & column, + const ISerialization::SubstreamPath & substream_path) const +{ + auto full_stream_name = ISerialization::getFileNameForStream(column, substream_path); + return full_name_to_stream_name.at(full_stream_name); +} ISerialization::OutputStreamGetter MergeTreeDataPartWriterWide::createStreamGetter( const NameAndTypePair & column, WrittenOffsetColumns & offset_columns) const @@ -139,8 +156,7 @@ ISerialization::OutputStreamGetter MergeTreeDataPartWriterWide::createStreamGett return [&, this] (const ISerialization::SubstreamPath & substream_path) -> WriteBuffer * { bool is_offsets = !substream_path.empty() && substream_path.back().type == ISerialization::Substream::ArraySizes; - - String stream_name = ISerialization::getFileNameForStream(column, substream_path); + auto stream_name = getStreamName(column, substream_path); /// Don't write offsets more than one time for Nested type. if (is_offsets && offset_columns.contains(stream_name)) @@ -289,8 +305,7 @@ StreamsWithMarks MergeTreeDataPartWriterWide::getCurrentMarksForColumn( data_part->getSerialization(column.name)->enumerateStreams([&] (const ISerialization::SubstreamPath & substream_path) { bool is_offsets = !substream_path.empty() && substream_path.back().type == ISerialization::Substream::ArraySizes; - - String stream_name = ISerialization::getFileNameForStream(column, substream_path); + auto stream_name = getStreamName(column, substream_path); /// Don't write offsets more than one time for Nested type. if (is_offsets && offset_columns.contains(stream_name)) @@ -328,14 +343,13 @@ void MergeTreeDataPartWriterWide::writeSingleGranule( serialization->enumerateStreams([&] (const ISerialization::SubstreamPath & substream_path) { bool is_offsets = !substream_path.empty() && substream_path.back().type == ISerialization::Substream::ArraySizes; - - String stream_name = ISerialization::getFileNameForStream(name_and_type, substream_path); + auto stream_name = getStreamName(name_and_type, substream_path); /// Don't write offsets more than one time for Nested type. 
         if (is_offsets && offset_columns.contains(stream_name))
             return;
 
-        column_streams[stream_name]->compressed_hashing.nextIfAtEnd();
+        column_streams.at(stream_name)->compressed_hashing.nextIfAtEnd();
     });
 }
 
@@ -406,10 +420,7 @@ void MergeTreeDataPartWriterWide::writeColumn(
         {
             bool is_offsets = !substream_path.empty() && substream_path.back().type == ISerialization::Substream::ArraySizes;
             if (is_offsets)
-            {
-                String stream_name = ISerialization::getFileNameForStream(name_and_type, substream_path);
-                offset_columns.insert(stream_name);
-            }
+                offset_columns.insert(getStreamName(name_and_type, substream_path));
         });
     }
 
@@ -656,10 +667,7 @@ void MergeTreeDataPartWriterWide::writeFinalMark(
     {
         bool is_offsets = !substream_path.empty() && substream_path.back().type == ISerialization::Substream::ArraySizes;
         if (is_offsets)
-        {
-            String stream_name = ISerialization::getFileNameForStream(column, substream_path);
-            offset_columns.insert(stream_name);
-        }
+            offset_columns.insert(getStreamName(column, substream_path));
     });
 }
 
diff --git a/src/Storages/MergeTree/MergeTreeDataPartWriterWide.h b/src/Storages/MergeTree/MergeTreeDataPartWriterWide.h
index 633b5119474..de7419fedb2 100644
--- a/src/Storages/MergeTree/MergeTreeDataPartWriterWide.h
+++ b/src/Storages/MergeTree/MergeTreeDataPartWriterWide.h
@@ -101,6 +101,7 @@ private:
     void adjustLastMarkIfNeedAndFlushToDisk(size_t new_rows_in_last_mark);
 
     ISerialization::OutputStreamGetter createStreamGetter(const NameAndTypePair & column, WrittenOffsetColumns & offset_columns) const;
+    const String & getStreamName(const NameAndTypePair & column, const ISerialization::SubstreamPath & substream_path) const;
 
     using SerializationState = ISerialization::SerializeBinaryBulkStatePtr;
     using SerializationStates = std::unordered_map;
 
@@ -110,6 +111,9 @@ private:
     using ColumnStreams = std::map;
     ColumnStreams column_streams;
 
+    /// Maps the full stream name (built from the column name) to the name used on disk, which is a SipHash128 of the full name when the latter is too long.
+    std::unordered_map full_name_to_stream_name;
+
     /// Non written marks to disk (for each column). Waiting until all rows for
     /// this marks will be written to disk.
     using MarksForColumns = std::unordered_map;
diff --git a/src/Storages/MergeTree/MergeTreeReaderWide.cpp b/src/Storages/MergeTree/MergeTreeReaderWide.cpp
index baacfa55c94..cd641a5cd2a 100644
--- a/src/Storages/MergeTree/MergeTreeReaderWide.cpp
+++ b/src/Storages/MergeTree/MergeTreeReaderWide.cpp
@@ -198,13 +198,21 @@ size_t MergeTreeReaderWide::readRows(
     catch (...)
     {
         data_part_info_for_read->reportBroken();
-        throw;
     }
 
     return read_rows;
 }
 
+std::optional getStreamName(
+    const NameAndTypePair & column,
+    const ISerialization::SubstreamPath & substream_path,
+    const MergeTreeDataPartChecksums & checksums)
+{
+    auto full_stream_name = ISerialization::getFileNameForStream(column, substream_path);
+    return checksums.getFileNameOrHash(full_stream_name);
+}
+
 void MergeTreeReaderWide::addStreams(
     const NameAndTypePair & name_and_type,
     const SerializationPtr & serialization,
@@ -216,35 +224,33 @@ void MergeTreeReaderWide::addStreams(
     ISerialization::StreamCallback callback = [&] (const ISerialization::SubstreamPath & substream_path)
     {
-        String stream_name = ISerialization::getFileNameForStream(name_and_type, substream_path);
-
-        if (streams.contains(stream_name))
-        {
-            has_any_stream = true;
-            return;
-        }
-
-        bool data_file_exists = data_part_info_for_read->getChecksums().files.contains(stream_name + DATA_FILE_EXTENSION);
+        auto stream_name = getStreamName(name_and_type, substream_path, data_part_info_for_read->getChecksums());
 
         /** If data file is missing then we will not try to open it.
* It is necessary since it allows to add new column to structure of the table without creating new files for old parts. */ - if (!data_file_exists) + if (!stream_name) { has_all_streams = false; return; } + if (streams.contains(*stream_name)) + { + has_any_stream = true; + return; + } + has_any_stream = true; bool is_lc_dict = substream_path.size() > 1 && substream_path[substream_path.size() - 2].type == ISerialization::Substream::Type::DictionaryKeys; auto context = data_part_info_for_read->getContext(); auto * load_marks_threadpool = settings.read_settings.load_marks_asynchronously ? &context->getLoadMarksThreadpool() : nullptr; - streams.emplace(stream_name, std::make_unique( - data_part_info_for_read, stream_name, DATA_FILE_EXTENSION, + streams.emplace(*stream_name, std::make_unique( + data_part_info_for_read, *stream_name, DATA_FILE_EXTENSION, data_part_info_for_read->getMarksCount(), all_mark_ranges, settings, mark_cache, - uncompressed_cache, data_part_info_for_read->getFileSizeOrZero(stream_name + DATA_FILE_EXTENSION), + uncompressed_cache, data_part_info_for_read->getFileSizeOrZero(*stream_name + DATA_FILE_EXTENSION), &data_part_info_for_read->getIndexGranularityInfo(), profile_callback, clock_type, is_lc_dict, load_marks_threadpool)); }; @@ -255,13 +261,14 @@ void MergeTreeReaderWide::addStreams( partially_read_columns.insert(name_and_type.name); } - static ReadBuffer * getStream( bool seek_to_start, const ISerialization::SubstreamPath & substream_path, + const MergeTreeDataPartChecksums & checksums, MergeTreeReaderWide::FileStreams & streams, const NameAndTypePair & name_and_type, - size_t from_mark, bool seek_to_mark, + size_t from_mark, + bool seek_to_mark, size_t current_task_last_mark, ISerialization::SubstreamsCache & cache) { @@ -269,9 +276,12 @@ static ReadBuffer * getStream( if (cache.contains(ISerialization::getSubcolumnNameForStream(substream_path))) return nullptr; - String stream_name = ISerialization::getFileNameForStream(name_and_type, substream_path); + auto stream_name = getStreamName(name_and_type, substream_path, checksums); - auto it = streams.find(stream_name); + if (!stream_name) + return nullptr; + + auto it = streams.find(*stream_name); if (it == streams.end()) return nullptr; @@ -298,7 +308,7 @@ void MergeTreeReaderWide::deserializePrefix( ISerialization::DeserializeBinaryBulkSettings deserialize_settings; deserialize_settings.getter = [&](const ISerialization::SubstreamPath & substream_path) { - return getStream(/* seek_to_start = */true, substream_path, streams, name_and_type, 0, /* seek_to_mark = */false, current_task_last_mark, cache); + return getStream(/* seek_to_start = */true, substream_path, data_part_info_for_read->getChecksums(), streams, name_and_type, 0, /* seek_to_mark = */false, current_task_last_mark, cache); }; serialization->deserializeBinaryBulkStatePrefix(deserialize_settings, deserialize_binary_bulk_state_map[name]); } @@ -317,15 +327,15 @@ void MergeTreeReaderWide::prefetchForColumn( serialization->enumerateStreams([&](const ISerialization::SubstreamPath & substream_path) { - String stream_name = ISerialization::getFileNameForStream(name_and_type, substream_path); + auto stream_name = getStreamName(name_and_type, substream_path, data_part_info_for_read->getChecksums()); - if (!prefetched_streams.contains(stream_name)) + if (stream_name && !prefetched_streams.contains(*stream_name)) { bool seek_to_mark = !continue_reading; - if (ReadBuffer * buf = getStream(false, substream_path, streams, name_and_type, from_mark, seek_to_mark, 
current_task_last_mark, cache)) + if (ReadBuffer * buf = getStream(false, substream_path, data_part_info_for_read->getChecksums(), streams, name_and_type, from_mark, seek_to_mark, current_task_last_mark, cache)) { buf->prefetch(priority); - prefetched_streams.insert(stream_name); + prefetched_streams.insert(*stream_name); } } }); @@ -348,8 +358,9 @@ void MergeTreeReaderWide::readData( bool seek_to_mark = !was_prefetched && !continue_reading; return getStream( - /* seek_to_start = */false, substream_path, streams, name_and_type, from_mark, - seek_to_mark, current_task_last_mark, cache); + /* seek_to_start = */false, substream_path, + data_part_info_for_read->getChecksums(), streams, + name_and_type, from_mark, seek_to_mark, current_task_last_mark, cache); }; deserialize_settings.continuous_reading = continue_reading; diff --git a/src/Storages/MergeTree/MergeTreeSettings.h b/src/Storages/MergeTree/MergeTreeSettings.h index 5ea99009756..ae4d585e5fe 100644 --- a/src/Storages/MergeTree/MergeTreeSettings.h +++ b/src/Storages/MergeTree/MergeTreeSettings.h @@ -34,6 +34,8 @@ struct Settings; M(UInt64, min_bytes_for_wide_part, 10485760, "Minimal uncompressed size in bytes to create part in wide format instead of compact", 0) \ M(UInt64, min_rows_for_wide_part, 0, "Minimal number of rows to create part in wide format instead of compact", 0) \ M(Float, ratio_of_defaults_for_sparse_serialization, 1.0, "Minimal ratio of number of default values to number of all values in column to store it in sparse serializations. If >= 1, columns will be always written in full serialization.", 0) \ + M(Bool, replace_long_file_name_to_hash, false, "", 0) \ + M(UInt64, max_file_name_length, 128, "", 0) \ \ /** Merge settings. */ \ M(UInt64, merge_max_block_size, 8192, "How many rows in blocks should be formed for merge operations. 
By default has the same value as `index_granularity`.", 0) \ From b30544a6ab6b773ed3dc7bd6c3cffcebbb6ae1b8 Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Tue, 6 Jun 2023 01:39:45 +0000 Subject: [PATCH 014/101] allow to replace long file names to hashes --- src/Storages/MergeTree/IMergeTreeDataPart.cpp | 6 +++- .../MergeTree/IMergedBlockOutputStream.cpp | 8 +++-- .../MergeTree/MergeTreeDataPartChecksum.cpp | 4 +-- .../MergeTree/MergeTreeDataPartChecksum.h | 2 +- .../MergeTree/MergeTreeDataPartWide.cpp | 24 +++++++++----- .../MergeTree/MergeTreeReaderWide.cpp | 33 +++++++++---------- src/Storages/MergeTree/MergeTreeSettings.h | 4 +-- src/Storages/MergeTree/MutateTask.cpp | 15 ++++++--- src/Storages/MergeTree/checkDataPart.cpp | 13 +++++++- .../System/StorageSystemPartsColumns.cpp | 7 ++-- 10 files changed, 75 insertions(+), 41 deletions(-) diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index d27b03fff44..dfc1fe0c262 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -1,4 +1,5 @@ #include "IMergeTreeDataPart.h" +#include "Common/SipHash.h" #include "Storages/MergeTree/IDataPartStorage.h" #include @@ -1015,7 +1016,10 @@ CompressionCodecPtr IMergeTreeDataPart::detectDefaultCompressionCodec() const { if (path_to_data_file.empty()) { - String candidate_path = /*fs::path(getRelativePath()) */ (ISerialization::getFileNameForStream(part_column, substream_path) + ".bin"); + auto candidate_path = ISerialization::getFileNameForStream(part_column, substream_path) + ".bin"; + + if (!getDataPartStorage().exists(candidate_path)) + candidate_path = sipHash128String(candidate_path) + ".bin"; /// We can have existing, but empty .bin files. Example: LowCardinality(Nullable(...)) columns and column_name.dict.null.bin file. if (getDataPartStorage().exists(candidate_path) && getDataPartStorage().getFileSize(candidate_path) != 0) diff --git a/src/Storages/MergeTree/IMergedBlockOutputStream.cpp b/src/Storages/MergeTree/IMergedBlockOutputStream.cpp index 21bead2864a..2df3b6d15a6 100644 --- a/src/Storages/MergeTree/IMergedBlockOutputStream.cpp +++ b/src/Storages/MergeTree/IMergedBlockOutputStream.cpp @@ -51,7 +51,9 @@ NameSet IMergedBlockOutputStream::removeEmptyColumnsFromPart( data_part->getSerialization(column.name)->enumerateStreams( [&](const ISerialization::SubstreamPath & substream_path) { - ++stream_counts[ISerialization::getFileNameForStream(column.name, substream_path)]; + auto full_stream_name = ISerialization::getFileNameForStream(column.name, substream_path); + auto stream_name = checksums.getFileNameOrHash(full_stream_name); + ++stream_counts[stream_name]; }); } @@ -65,7 +67,9 @@ NameSet IMergedBlockOutputStream::removeEmptyColumnsFromPart( ISerialization::StreamCallback callback = [&](const ISerialization::SubstreamPath & substream_path) { - String stream_name = ISerialization::getFileNameForStream(column_name, substream_path); + auto full_stream_name = ISerialization::getFileNameForStream(column_name, substream_path); + auto stream_name = checksums.getFileNameOrHash(full_stream_name); + /// Delete files if they are no longer shared with another column. 
if (--stream_counts[stream_name] == 0) { diff --git a/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp b/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp index 2f97edd1a9c..7d39ea0707f 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp @@ -341,7 +341,7 @@ MergeTreeDataPartChecksums::Checksum::uint128 MergeTreeDataPartChecksums::getTot return ret; } -std::optional MergeTreeDataPartChecksums::getFileNameOrHash(const String & name) const +String MergeTreeDataPartChecksums::getFileNameOrHash(const String & name) const { if (files.contains(name + ".bin")) return name; @@ -350,7 +350,7 @@ std::optional MergeTreeDataPartChecksums::getFileNameOrHash(const String if (files.contains(hash + ".bin")) return hash; - return std::nullopt; + return name; } void MinimalisticDataPartChecksums::serialize(WriteBuffer & to) const diff --git a/src/Storages/MergeTree/MergeTreeDataPartChecksum.h b/src/Storages/MergeTree/MergeTreeDataPartChecksum.h index 626b0a90839..2a38b52c72a 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartChecksum.h +++ b/src/Storages/MergeTree/MergeTreeDataPartChecksum.h @@ -89,7 +89,7 @@ struct MergeTreeDataPartChecksums UInt64 getTotalSizeOnDisk() const; - std::optional getFileNameOrHash(const String & name) const; + String getFileNameOrHash(const String & name) const; }; diff --git a/src/Storages/MergeTree/MergeTreeDataPartWide.cpp b/src/Storages/MergeTree/MergeTreeDataPartWide.cpp index f44cbdd8628..645e16eed38 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWide.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartWide.cpp @@ -73,19 +73,20 @@ ColumnSize MergeTreeDataPartWide::getColumnSizeImpl( getSerialization(column.name)->enumerateStreams([&](const ISerialization::SubstreamPath & substream_path) { - String file_name = ISerialization::getFileNameForStream(column, substream_path); + auto full_stream_name = ISerialization::getFileNameForStream(column, substream_path); + auto stream_name = checksums.getFileNameOrHash(full_stream_name); - if (processed_substreams && !processed_substreams->insert(file_name).second) + if (processed_substreams && !processed_substreams->insert(stream_name).second) return; - auto bin_checksum = checksums.files.find(file_name + ".bin"); + auto bin_checksum = checksums.files.find(stream_name + ".bin"); if (bin_checksum != checksums.files.end()) { size.data_compressed += bin_checksum->second.file_size; size.data_uncompressed += bin_checksum->second.uncompressed_size; } - auto mrk_checksum = checksums.files.find(file_name + getMarksFileExtension()); + auto mrk_checksum = checksums.files.find(stream_name + getMarksFileExtension()); if (mrk_checksum != checksums.files.end()) size.marks += mrk_checksum->second.file_size; }); @@ -185,9 +186,11 @@ void MergeTreeDataPartWide::checkConsistency(bool require_part_metadata) const { getSerialization(name_type.name)->enumerateStreams([&](const ISerialization::SubstreamPath & substream_path) { - String file_name = ISerialization::getFileNameForStream(name_type, substream_path); - String mrk_file_name = file_name + marks_file_extension; - String bin_file_name = file_name + DATA_FILE_EXTENSION; + String full_stream_name = ISerialization::getFileNameForStream(name_type, substream_path); + String stream_name = checksums.getFileNameOrHash(full_stream_name); + + String mrk_file_name = stream_name + marks_file_extension; + String bin_file_name = stream_name + DATA_FILE_EXTENSION; if (!checksums.files.contains(mrk_file_name)) throw Exception( @@ 
-213,6 +216,8 @@ void MergeTreeDataPartWide::checkConsistency(bool require_part_metadata) const
             getSerialization(name_type.name)->enumerateStreams([&](const ISerialization::SubstreamPath & substream_path)
             {
                 auto file_path = ISerialization::getFileNameForStream(name_type, substream_path) + marks_file_extension;
+                if (!getDataPartStorage().exists(file_path))
+                    file_path = sipHash128String(file_path) + marks_file_extension;
 
                 /// Missing file is Ok for case when new column was added.
                 if (getDataPartStorage().exists(file_path))
@@ -266,7 +271,10 @@ String MergeTreeDataPartWide::getFileNameForColumn(const NameAndTypePair & colum
     getSerialization(column.name)->enumerateStreams([&](const ISerialization::SubstreamPath & substream_path)
     {
         if (filename.empty())
-            filename = ISerialization::getFileNameForStream(column, substream_path);
+        {
+            auto full_stream_name = ISerialization::getFileNameForStream(column, substream_path);
+            filename = checksums.getFileNameOrHash(full_stream_name);
+        }
     });
     return filename;
 }
diff --git a/src/Storages/MergeTree/MergeTreeReaderWide.cpp b/src/Storages/MergeTree/MergeTreeReaderWide.cpp
index cd641a5cd2a..0ce20dc02f0 100644
--- a/src/Storages/MergeTree/MergeTreeReaderWide.cpp
+++ b/src/Storages/MergeTree/MergeTreeReaderWide.cpp
@@ -204,7 +204,7 @@ size_t MergeTreeReaderWide::readRows(
     return read_rows;
 }
 
-std::optional getStreamName(
+String getStreamName(
     const NameAndTypePair & column,
     const ISerialization::SubstreamPath & substream_path,
     const MergeTreeDataPartChecksums & checksums)
@@ -226,18 +226,20 @@ void MergeTreeReaderWide::addStreams(
     {
         auto stream_name = getStreamName(name_and_type, substream_path, data_part_info_for_read->getChecksums());
 
-        /** If data file is missing then we will not try to open it.
-         * It is necessary since it allows to add new column to structure of the table without creating new files for old parts.
-         */
-        if (!stream_name)
+        if (streams.contains(stream_name))
         {
-            has_all_streams = false;
+            has_any_stream = true;
             return;
         }
 
-        if (streams.contains(*stream_name))
+        bool data_file_exists = data_part_info_for_read->getChecksums().files.contains(stream_name + DATA_FILE_EXTENSION);
+
+        /** If data file is missing then we will not try to open it.
+         * It is necessary since it allows to add new column to structure of the table without creating new files for old parts.
+         */
+        if (!data_file_exists)
         {
-            has_any_stream = true;
+            has_all_streams = false;
             return;
         }
 
@@ -247,10 +249,10 @@ void MergeTreeReaderWide::addStreams(
         auto context = data_part_info_for_read->getContext();
         auto * load_marks_threadpool = settings.read_settings.load_marks_asynchronously ?
&context->getLoadMarksThreadpool() : nullptr; - streams.emplace(*stream_name, std::make_unique( - data_part_info_for_read, *stream_name, DATA_FILE_EXTENSION, + streams.emplace(stream_name, std::make_unique( + data_part_info_for_read, stream_name, DATA_FILE_EXTENSION, data_part_info_for_read->getMarksCount(), all_mark_ranges, settings, mark_cache, - uncompressed_cache, data_part_info_for_read->getFileSizeOrZero(*stream_name + DATA_FILE_EXTENSION), + uncompressed_cache, data_part_info_for_read->getFileSizeOrZero(stream_name + DATA_FILE_EXTENSION), &data_part_info_for_read->getIndexGranularityInfo(), profile_callback, clock_type, is_lc_dict, load_marks_threadpool)); }; @@ -278,10 +280,7 @@ static ReadBuffer * getStream( auto stream_name = getStreamName(name_and_type, substream_path, checksums); - if (!stream_name) - return nullptr; - - auto it = streams.find(*stream_name); + auto it = streams.find(stream_name); if (it == streams.end()) return nullptr; @@ -329,13 +328,13 @@ void MergeTreeReaderWide::prefetchForColumn( { auto stream_name = getStreamName(name_and_type, substream_path, data_part_info_for_read->getChecksums()); - if (stream_name && !prefetched_streams.contains(*stream_name)) + if (!prefetched_streams.contains(stream_name)) { bool seek_to_mark = !continue_reading; if (ReadBuffer * buf = getStream(false, substream_path, data_part_info_for_read->getChecksums(), streams, name_and_type, from_mark, seek_to_mark, current_task_last_mark, cache)) { buf->prefetch(priority); - prefetched_streams.insert(*stream_name); + prefetched_streams.insert(stream_name); } } }); diff --git a/src/Storages/MergeTree/MergeTreeSettings.h b/src/Storages/MergeTree/MergeTreeSettings.h index ae4d585e5fe..0d32567d2fa 100644 --- a/src/Storages/MergeTree/MergeTreeSettings.h +++ b/src/Storages/MergeTree/MergeTreeSettings.h @@ -34,8 +34,8 @@ struct Settings; M(UInt64, min_bytes_for_wide_part, 10485760, "Minimal uncompressed size in bytes to create part in wide format instead of compact", 0) \ M(UInt64, min_rows_for_wide_part, 0, "Minimal number of rows to create part in wide format instead of compact", 0) \ M(Float, ratio_of_defaults_for_sparse_serialization, 1.0, "Minimal ratio of number of default values to number of all values in column to store it in sparse serializations. If >= 1, columns will be always written in full serialization.", 0) \ - M(Bool, replace_long_file_name_to_hash, false, "", 0) \ - M(UInt64, max_file_name_length, 128, "", 0) \ + M(Bool, replace_long_file_name_to_hash, false, "If the file name for column is too long (more than 'max_file_name_length' bytes) replace it to SipHash128", 0) \ + M(UInt64, max_file_name_length, 128, "The maximal length of the file name to keep it as is without hashing", 0) \ \ /** Merge settings. */ \ M(UInt64, merge_max_block_size, 8192, "How many rows in blocks should be formed for merge operations. 
By default has the same value as `index_granularity`.", 0) \ diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index 76096d00641..4bcaea53337 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -1,3 +1,4 @@ +#include "Common/SipHash.h" #include #include @@ -591,7 +592,8 @@ static std::unordered_map getStreamCounts( { auto callback = [&](const ISerialization::SubstreamPath & substream_path) { - auto stream_name = ISerialization::getFileNameForStream(column_name, substream_path); + auto full_stream_name = ISerialization::getFileNameForStream(column_name, substream_path); + auto stream_name = data_part->checksums.getFileNameOrHash(full_stream_name); ++stream_counts[stream_name]; }; @@ -705,7 +707,9 @@ static NameToNameVector collectFilesForRenames( { ISerialization::StreamCallback callback = [&](const ISerialization::SubstreamPath & substream_path) { - String stream_name = ISerialization::getFileNameForStream({command.column_name, command.data_type}, substream_path); + auto full_stream_name = ISerialization::getFileNameForStream({command.column_name, command.data_type}, substream_path); + auto stream_name = source_part->checksums.getFileNameOrHash(full_stream_name); + /// Delete files if they are no longer shared with another column. if (--stream_counts[stream_name] == 0) { @@ -724,8 +728,11 @@ static NameToNameVector collectFilesForRenames( ISerialization::StreamCallback callback = [&](const ISerialization::SubstreamPath & substream_path) { - String stream_from = ISerialization::getFileNameForStream(command.column_name, substream_path); - String stream_to = boost::replace_first_copy(stream_from, escaped_name_from, escaped_name_to); + String full_stream_from = ISerialization::getFileNameForStream(command.column_name, substream_path); + String full_stream_to = boost::replace_first_copy(full_stream_from, escaped_name_from, escaped_name_to); + + String stream_from = source_part->checksums.getFileNameOrHash(full_stream_from); + String stream_to = stream_from == full_stream_from ? 
full_stream_to : sipHash128String(full_stream_to); if (stream_from != stream_to) { diff --git a/src/Storages/MergeTree/checkDataPart.cpp b/src/Storages/MergeTree/checkDataPart.cpp index 00710ed3ed6..561f76d8b5f 100644 --- a/src/Storages/MergeTree/checkDataPart.cpp +++ b/src/Storages/MergeTree/checkDataPart.cpp @@ -11,6 +11,7 @@ #include #include #include +#include namespace CurrentMetrics @@ -30,6 +31,7 @@ namespace ErrorCodes extern const int CANNOT_MUNMAP; extern const int CANNOT_MREMAP; extern const int UNEXPECTED_FILE_IN_DATA_PART; + extern const int NO_FILE_IN_DATA_PART; } @@ -137,7 +139,16 @@ IMergeTreeDataPart::Checksums checkDataPart( { get_serialization(column)->enumerateStreams([&](const ISerialization::SubstreamPath & substream_path) { - String file_name = ISerialization::getFileNameForStream(column, substream_path) + ".bin"; + auto file_name = ISerialization::getFileNameForStream(column, substream_path) + ".bin"; + + if (!data_part_storage.exists(file_name)) + file_name = sipHash128String(file_name); + + if (!data_part_storage.exists(file_name)) + throw Exception(ErrorCodes::NO_FILE_IN_DATA_PART, + "There is no file for column '{}' in data part '{}'", + column.name, data_part->name); + checksums_data.files[file_name] = checksum_compressed_file(data_part_storage, file_name); }); } diff --git a/src/Storages/System/StorageSystemPartsColumns.cpp b/src/Storages/System/StorageSystemPartsColumns.cpp index 00b958b015f..de874b22e7e 100644 --- a/src/Storages/System/StorageSystemPartsColumns.cpp +++ b/src/Storages/System/StorageSystemPartsColumns.cpp @@ -261,16 +261,17 @@ void StorageSystemPartsColumns::processNextStorage( ColumnSize size; NameAndTypePair subcolumn(column.name, name, column.type, data.type); - String file_name = ISerialization::getFileNameForStream(subcolumn, subpath); + String full_stream_name = ISerialization::getFileNameForStream(subcolumn, subpath); + String stream_name = part->checksums.getFileNameOrHash(full_stream_name); - auto bin_checksum = part->checksums.files.find(file_name + ".bin"); + auto bin_checksum = part->checksums.files.find(stream_name + ".bin"); if (bin_checksum != part->checksums.files.end()) { size.data_compressed += bin_checksum->second.file_size; size.data_uncompressed += bin_checksum->second.uncompressed_size; } - auto mrk_checksum = part->checksums.files.find(file_name + part->index_granularity_info.mark_type.getFileExtension()); + auto mrk_checksum = part->checksums.files.find(stream_name + part->index_granularity_info.mark_type.getFileExtension()); if (mrk_checksum != part->checksums.files.end()) size.marks += mrk_checksum->second.file_size; From 0b06f247829d15fcf493d3d1804592ef0b9bd9c2 Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Tue, 6 Jun 2023 01:40:34 +0000 Subject: [PATCH 015/101] temporarly enable hashing of names --- src/Storages/MergeTree/MergeTreeSettings.h | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/Storages/MergeTree/MergeTreeSettings.h b/src/Storages/MergeTree/MergeTreeSettings.h index 0d32567d2fa..d63e33e2477 100644 --- a/src/Storages/MergeTree/MergeTreeSettings.h +++ b/src/Storages/MergeTree/MergeTreeSettings.h @@ -34,8 +34,8 @@ struct Settings; M(UInt64, min_bytes_for_wide_part, 10485760, "Minimal uncompressed size in bytes to create part in wide format instead of compact", 0) \ M(UInt64, min_rows_for_wide_part, 0, "Minimal number of rows to create part in wide format instead of compact", 0) \ M(Float, ratio_of_defaults_for_sparse_serialization, 1.0, "Minimal ratio of number of default values 
to number of all values in column to store it in sparse serializations. If >= 1, columns will be always written in full serialization.", 0) \ - M(Bool, replace_long_file_name_to_hash, false, "If the file name for column is too long (more than 'max_file_name_length' bytes) replace it to SipHash128", 0) \ - M(UInt64, max_file_name_length, 128, "The maximal length of the file name to keep it as is without hashing", 0) \ + M(Bool, replace_long_file_name_to_hash, true, "If the file name for column is too long (more than 'max_file_name_length' bytes) replace it to SipHash128", 0) \ + M(UInt64, max_file_name_length, 0, "The maximal length of the file name to keep it as is without hashing", 0) \ \ /** Merge settings. */ \ M(UInt64, merge_max_block_size, 8192, "How many rows in blocks should be formed for merge operations. By default has the same value as `index_granularity`.", 0) \ From a8a561b28cd8f1f5835c0bce288755fbe0819928 Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Tue, 6 Jun 2023 01:54:01 +0000 Subject: [PATCH 016/101] fix typo --- src/Storages/MergeTree/MergeTreeDataPartWide.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Storages/MergeTree/MergeTreeDataPartWide.cpp b/src/Storages/MergeTree/MergeTreeDataPartWide.cpp index 645e16eed38..04e672933a5 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWide.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartWide.cpp @@ -273,7 +273,7 @@ String MergeTreeDataPartWide::getFileNameForColumn(const NameAndTypePair & colum if (filename.empty()) { auto full_stream_name = ISerialization::getFileNameForStream(column, substream_path); - auto filname = checksums.getFileNameOrHash(full_stream_name); + filename = checksums.getFileNameOrHash(full_stream_name); } }); return filename; From 562ad9536669b9932cc196852354bfdb8f484402 Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Tue, 6 Jun 2023 18:01:11 +0000 Subject: [PATCH 017/101] fix getting the size of column --- src/Storages/MergeTree/MergeTreeDataPartWide.cpp | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/src/Storages/MergeTree/MergeTreeDataPartWide.cpp b/src/Storages/MergeTree/MergeTreeDataPartWide.cpp index 04e672933a5..f8627ec8073 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWide.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartWide.cpp @@ -257,8 +257,10 @@ bool MergeTreeDataPartWide::hasColumnFiles(const NameAndTypePair & column) const bool res = true; getSerialization(column.name)->enumerateStreams([&](const auto & substream_path) { - String file_name = ISerialization::getFileNameForStream(column, substream_path); - if (!check_stream_exists(file_name)) + auto full_stream_name = ISerialization::getFileNameForStream(column, substream_path); + auto stream_name = checksums.getFileNameOrHash(full_stream_name); + + if (!check_stream_exists(stream_name)) res = false; }); From 8864e30d2eee950d5d4d6eaaa910754cb66b9343 Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Thu, 22 Jun 2023 15:17:13 +0000 Subject: [PATCH 018/101] fix replacing column names after mutation --- src/Storages/MergeTree/IMergeTreeDataPart.cpp | 1 - .../MergeTree/IMergeTreeDataPartWriter.h | 2 +- .../MergeTree/MergeTreeDataPartChecksum.cpp | 37 ++++++------------- .../MergeTreeDataPartWriterCompact.cpp | 2 +- .../MergeTreeDataPartWriterCompact.h | 2 +- .../MergeTreeDataPartWriterInMemory.cpp | 2 +- .../MergeTreeDataPartWriterInMemory.h | 2 +- .../MergeTree/MergeTreeDataPartWriterWide.cpp | 22 ++++++++--- .../MergeTree/MergeTreeDataPartWriterWide.h | 9 +++-- 
.../MergeTree/MergedBlockOutputStream.cpp | 6 ++- .../MergedColumnOnlyOutputStream.cpp | 10 +++-- .../configs/wide_parts_only.xml | 1 + .../configs/wide_parts_only.xml | 1 + .../test_filesystem_layout/test.py | 2 +- .../configs/wide_parts_only.xml | 1 + tests/integration/test_partition/test.py | 2 +- 16 files changed, 54 insertions(+), 48 deletions(-) diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index fa33bef1582..289c41e5d10 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -1,5 +1,4 @@ #include "IMergeTreeDataPart.h" -#include "Common/SipHash.h" #include "Storages/MergeTree/IDataPartStorage.h" #include diff --git a/src/Storages/MergeTree/IMergeTreeDataPartWriter.h b/src/Storages/MergeTree/IMergeTreeDataPartWriter.h index fa3c675f7da..3f359904ddd 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPartWriter.h +++ b/src/Storages/MergeTree/IMergeTreeDataPartWriter.h @@ -32,7 +32,7 @@ public: virtual void write(const Block & block, const IColumn::Permutation * permutation) = 0; - virtual void fillChecksums(IMergeTreeDataPart::Checksums & checksums) = 0; + virtual void fillChecksums(IMergeTreeDataPart::Checksums & checksums, NameSet & checksums_to_remove) = 0; virtual void finish(bool sync) = 0; diff --git a/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp b/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp index 7d39ea0707f..5dc71147246 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp @@ -68,44 +68,35 @@ void MergeTreeDataPartChecksum::checkSize(const IDataPartStorage & storage, cons void MergeTreeDataPartChecksums::checkEqual(const MergeTreeDataPartChecksums & rhs, bool have_uncompressed) const { - for (const auto & it : rhs.files) - { - const String & name = it.first; - + for (const auto & [name, _] : rhs.files) if (!files.contains(name)) throw Exception(ErrorCodes::UNEXPECTED_FILE_IN_DATA_PART, "Unexpected file {} in data part", name); - } - for (const auto & it : files) + for (const auto & [name, checksum] : files) { - const String & name = it.first; - /// Exclude files written by inverted index from check. No correct checksums are available for them currently. 
if (name.ends_with(".gin_dict") || name.ends_with(".gin_post") || name.ends_with(".gin_seg") || name.ends_with(".gin_sid")) continue; - auto jt = rhs.files.find(name); - if (jt == rhs.files.end()) + auto it = rhs.files.find(name); + if (it == rhs.files.end()) throw Exception(ErrorCodes::NO_FILE_IN_DATA_PART, "No file {} in data part", name); - it.second.checkEqual(jt->second, have_uncompressed, name); + checksum.checkEqual(it->second, have_uncompressed, name); } } void MergeTreeDataPartChecksums::checkSizes(const IDataPartStorage & storage) const { - for (const auto & it : files) - { - const String & name = it.first; - it.second.checkSize(storage, name); - } + for (const auto & [name, checksum] : files) + checksum.checkSize(storage, name); } UInt64 MergeTreeDataPartChecksums::getTotalSizeOnDisk() const { UInt64 res = 0; - for (const auto & it : files) - res += it.second.file_size; + for (const auto & [_, checksum] : files) + res += checksum.file_size; return res; } @@ -219,11 +210,8 @@ void MergeTreeDataPartChecksums::write(WriteBuffer & to) const writeVarUInt(files.size(), out); - for (const auto & it : files) + for (const auto & [name, sum] : files) { - const String & name = it.first; - const Checksum & sum = it.second; - writeBinary(name, out); writeVarUInt(sum.file_size, out); writePODBinary(sum.file_hash, out); @@ -256,11 +244,8 @@ void MergeTreeDataPartChecksums::add(MergeTreeDataPartChecksums && rhs_checksums void MergeTreeDataPartChecksums::computeTotalChecksumDataOnly(SipHash & hash) const { /// We use fact that iteration is in deterministic (lexicographical) order. - for (const auto & it : files) + for (const auto & [name, sum] : files) { - const String & name = it.first; - const Checksum & sum = it.second; - if (!endsWith(name, ".bin")) continue; diff --git a/src/Storages/MergeTree/MergeTreeDataPartWriterCompact.cpp b/src/Storages/MergeTree/MergeTreeDataPartWriterCompact.cpp index 0b650eb9f16..9b8f1155912 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWriterCompact.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartWriterCompact.cpp @@ -403,7 +403,7 @@ size_t MergeTreeDataPartWriterCompact::ColumnsBuffer::size() const return accumulated_columns.at(0)->size(); } -void MergeTreeDataPartWriterCompact::fillChecksums(IMergeTreeDataPart::Checksums & checksums) +void MergeTreeDataPartWriterCompact::fillChecksums(IMergeTreeDataPart::Checksums & checksums, NameSet & /*checksums_to_remove*/) { // If we don't have anything to write, skip finalization. 
if (!columns_list.empty()) diff --git a/src/Storages/MergeTree/MergeTreeDataPartWriterCompact.h b/src/Storages/MergeTree/MergeTreeDataPartWriterCompact.h index 06f8122393f..b1cfefd2d8f 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWriterCompact.h +++ b/src/Storages/MergeTree/MergeTreeDataPartWriterCompact.h @@ -22,7 +22,7 @@ public: void write(const Block & block, const IColumn::Permutation * permutation) override; - void fillChecksums(IMergeTreeDataPart::Checksums & checksums) override; + void fillChecksums(IMergeTreeDataPart::Checksums & checksums, NameSet & checksums_to_remove) override; void finish(bool sync) override; private: diff --git a/src/Storages/MergeTree/MergeTreeDataPartWriterInMemory.cpp b/src/Storages/MergeTree/MergeTreeDataPartWriterInMemory.cpp index 9afa7a1e80d..048339b58c9 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWriterInMemory.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartWriterInMemory.cpp @@ -76,7 +76,7 @@ void MergeTreeDataPartWriterInMemory::calculateAndSerializePrimaryIndex(const Bl } } -void MergeTreeDataPartWriterInMemory::fillChecksums(IMergeTreeDataPart::Checksums & checksums) +void MergeTreeDataPartWriterInMemory::fillChecksums(IMergeTreeDataPart::Checksums & checksums, NameSet & /*checksums_to_remove*/) { /// If part is empty we still need to initialize block by empty columns. if (!part_in_memory->block) diff --git a/src/Storages/MergeTree/MergeTreeDataPartWriterInMemory.h b/src/Storages/MergeTree/MergeTreeDataPartWriterInMemory.h index 9e1e868beac..2d333822652 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWriterInMemory.h +++ b/src/Storages/MergeTree/MergeTreeDataPartWriterInMemory.h @@ -18,7 +18,7 @@ public: /// You can write only one block. In-memory part can be written only at INSERT. void write(const Block & block, const IColumn::Permutation * permutation) override; - void fillChecksums(IMergeTreeDataPart::Checksums & checksums) override; + void fillChecksums(IMergeTreeDataPart::Checksums & checksums, NameSet & checksums_to_remove) override; void finish(bool /*sync*/) override {} private: diff --git a/src/Storages/MergeTree/MergeTreeDataPartWriterWide.cpp b/src/Storages/MergeTree/MergeTreeDataPartWriterWide.cpp index 60bb1119770..c9dae9a1f2c 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWriterWide.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartWriterWide.cpp @@ -136,6 +136,7 @@ void MergeTreeDataPartWriterWide::addStreams( settings.query_write_settings); full_name_to_stream_name.emplace(full_stream_name, stream_name); + stream_name_to_full_name.emplace(stream_name, full_stream_name); }; ISerialization::SubstreamPath path; @@ -562,7 +563,7 @@ void MergeTreeDataPartWriterWide::validateColumnOfFixedSize(const NameAndTypePai } -void MergeTreeDataPartWriterWide::fillDataChecksums(IMergeTreeDataPart::Checksums & checksums) +void MergeTreeDataPartWriterWide::fillDataChecksums(IMergeTreeDataPart::Checksums & checksums, NameSet & checksums_to_remove) { const auto & global_settings = storage.getContext()->getSettingsRef(); ISerialization::SerializeBinaryBulkSettings serialize_settings; @@ -598,10 +599,19 @@ void MergeTreeDataPartWriterWide::fillDataChecksums(IMergeTreeDataPart::Checksum } } - for (auto & stream : column_streams) + for (auto & [stream_name, stream] : column_streams) { - stream.second->preFinalize(); - stream.second->addToChecksums(checksums); + /// Remove checksums for old stream name if file was + /// renamed due to replacing the name to the hash of name. 
+ const auto & full_stream_name = stream_name_to_full_name.at(stream_name); + if (stream_name != full_stream_name) + { + checksums_to_remove.insert(full_stream_name + stream->data_file_extension); + checksums_to_remove.insert(full_stream_name + stream->marks_file_extension); + } + + stream->preFinalize(); + stream->addToChecksums(checksums); } } @@ -633,11 +643,11 @@ void MergeTreeDataPartWriterWide::finishDataSerialization(bool sync) } -void MergeTreeDataPartWriterWide::fillChecksums(IMergeTreeDataPart::Checksums & checksums) +void MergeTreeDataPartWriterWide::fillChecksums(IMergeTreeDataPart::Checksums & checksums, NameSet & checksums_to_remove) { // If we don't have anything to write, skip finalization. if (!columns_list.empty()) - fillDataChecksums(checksums); + fillDataChecksums(checksums, checksums_to_remove); if (settings.rewrite_primary_key) fillPrimaryIndexChecksums(checksums); diff --git a/src/Storages/MergeTree/MergeTreeDataPartWriterWide.h b/src/Storages/MergeTree/MergeTreeDataPartWriterWide.h index de7419fedb2..c274fc9807c 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWriterWide.h +++ b/src/Storages/MergeTree/MergeTreeDataPartWriterWide.h @@ -29,14 +29,14 @@ public: void write(const Block & block, const IColumn::Permutation * permutation) override; - void fillChecksums(IMergeTreeDataPart::Checksums & checksums) final; + void fillChecksums(IMergeTreeDataPart::Checksums & checksums, NameSet & checksums_to_remove) final; void finish(bool sync) final; private: /// Finish serialization of data: write final mark if required and compute checksums /// Also validate written data in debug mode - void fillDataChecksums(IMergeTreeDataPart::Checksums & checksums); + void fillDataChecksums(IMergeTreeDataPart::Checksums & checksums, NameSet & checksums_to_remove); void finishDataSerialization(bool sync); /// Write data of one column. @@ -111,8 +111,11 @@ private: using ColumnStreams = std::map; ColumnStreams column_streams; - /// TODO: + /// Some long column names may be replaced to hashes. + /// Below are mapping from original stream name to actual + /// stream name (probably hash of the stream) and vice versa. std::unordered_map full_name_to_stream_name; + std::unordered_map stream_name_to_full_name; /// Non written marks to disk (for each column). Waiting until all rows for /// this marks will be written to disk. diff --git a/src/Storages/MergeTree/MergedBlockOutputStream.cpp b/src/Storages/MergeTree/MergedBlockOutputStream.cpp index c93ad135835..1ebb1d87aae 100644 --- a/src/Storages/MergeTree/MergedBlockOutputStream.cpp +++ b/src/Storages/MergeTree/MergedBlockOutputStream.cpp @@ -142,12 +142,16 @@ MergedBlockOutputStream::Finalizer MergedBlockOutputStream::finalizePartAsync( { /// Finish write and get checksums. MergeTreeData::DataPart::Checksums checksums; + NameSet checksums_to_remove; if (additional_column_checksums) checksums = std::move(*additional_column_checksums); /// Finish columns serialization. 
- writer->fillChecksums(checksums); + writer->fillChecksums(checksums, checksums_to_remove); + + for (const auto & name : checksums_to_remove) + checksums.files.erase(name); LOG_TRACE(&Poco::Logger::get("MergedBlockOutputStream"), "filled checksums {}", new_part->getNameWithState()); diff --git a/src/Storages/MergeTree/MergedColumnOnlyOutputStream.cpp b/src/Storages/MergeTree/MergedColumnOnlyOutputStream.cpp index 3b2eb96f2d4..108f364fc2d 100644 --- a/src/Storages/MergeTree/MergedColumnOnlyOutputStream.cpp +++ b/src/Storages/MergeTree/MergedColumnOnlyOutputStream.cpp @@ -63,7 +63,11 @@ MergedColumnOnlyOutputStream::fillChecksums( { /// Finish columns serialization. MergeTreeData::DataPart::Checksums checksums; - writer->fillChecksums(checksums); + NameSet checksums_to_remove; + writer->fillChecksums(checksums, checksums_to_remove); + + for (const auto & filename : checksums_to_remove) + all_checksums.files.erase(filename); for (const auto & [projection_name, projection_part] : new_part->getProjectionParts()) checksums.addFile( @@ -80,9 +84,7 @@ MergedColumnOnlyOutputStream::fillChecksums( for (const String & removed_file : removed_files) { new_part->getDataPartStorage().removeFileIfExists(removed_file); - - if (all_checksums.files.contains(removed_file)) - all_checksums.files.erase(removed_file); + all_checksums.files.erase(removed_file); } new_part->setColumns(columns, serialization_infos, metadata_snapshot->getMetadataVersion()); diff --git a/tests/integration/test_backward_compatibility/configs/wide_parts_only.xml b/tests/integration/test_backward_compatibility/configs/wide_parts_only.xml index e9cf053f1c5..674ffff6c93 100644 --- a/tests/integration/test_backward_compatibility/configs/wide_parts_only.xml +++ b/tests/integration/test_backward_compatibility/configs/wide_parts_only.xml @@ -1,5 +1,6 @@ 0 + 0 diff --git a/tests/integration/test_default_compression_codec/configs/wide_parts_only.xml b/tests/integration/test_default_compression_codec/configs/wide_parts_only.xml index 10b9edef36d..4d1a3357799 100644 --- a/tests/integration/test_default_compression_codec/configs/wide_parts_only.xml +++ b/tests/integration/test_default_compression_codec/configs/wide_parts_only.xml @@ -2,5 +2,6 @@ 0 0 + 0 diff --git a/tests/integration/test_filesystem_layout/test.py b/tests/integration/test_filesystem_layout/test.py index 2be478f95d0..81f3b67cb75 100644 --- a/tests/integration/test_filesystem_layout/test.py +++ b/tests/integration/test_filesystem_layout/test.py @@ -23,7 +23,7 @@ def test_file_path_escaping(started_cluster): node.query( """ CREATE TABLE test.`T.a_b,l-e!` (`~Id` UInt32) - ENGINE = MergeTree() PARTITION BY `~Id` ORDER BY `~Id` SETTINGS min_bytes_for_wide_part = 0; + ENGINE = MergeTree() PARTITION BY `~Id` ORDER BY `~Id` SETTINGS min_bytes_for_wide_part = 0, replace_long_file_name_to_hash = 0; """ ) node.query("""INSERT INTO test.`T.a_b,l-e!` VALUES (1);""") diff --git a/tests/integration/test_mutations_hardlinks/configs/wide_parts_only.xml b/tests/integration/test_mutations_hardlinks/configs/wide_parts_only.xml index 10b9edef36d..4d1a3357799 100644 --- a/tests/integration/test_mutations_hardlinks/configs/wide_parts_only.xml +++ b/tests/integration/test_mutations_hardlinks/configs/wide_parts_only.xml @@ -2,5 +2,6 @@ 0 0 + 0 diff --git a/tests/integration/test_partition/test.py b/tests/integration/test_partition/test.py index 93f03f4420e..7634c81f807 100644 --- a/tests/integration/test_partition/test.py +++ b/tests/integration/test_partition/test.py @@ -150,7 +150,7 @@ def 
partition_table_complex(started_cluster): q("DROP TABLE IF EXISTS test.partition_complex") q( "CREATE TABLE test.partition_complex (p Date, k Int8, v1 Int8 MATERIALIZED k + 1) " - "ENGINE = MergeTree PARTITION BY p ORDER BY k SETTINGS index_granularity=1, index_granularity_bytes=0, compress_marks=false, compress_primary_key=false" + "ENGINE = MergeTree PARTITION BY p ORDER BY k SETTINGS index_granularity=1, index_granularity_bytes=0, compress_marks=false, compress_primary_key=false, replace_long_file_name_to_hash = false" ) q("INSERT INTO test.partition_complex (p, k) VALUES(toDate(31), 1)") q("INSERT INTO test.partition_complex (p, k) VALUES(toDate(1), 2)") From a71cd56a906a05fd31e878112b79f58676a8156e Mon Sep 17 00:00:00 2001 From: avogar Date: Tue, 1 Aug 2023 10:06:56 +0000 Subject: [PATCH 019/101] Output valid JSON/XML on excetpion during HTTP query execution --- docs/en/interfaces/http.md | 13 + src/Core/Settings.h | 1 + src/Core/SettingsChangesHistory.h | 1 + src/Formats/FormatFactory.cpp | 8 +- src/Formats/FormatSettings.h | 6 + src/Formats/JSONUtils.cpp | 6 + src/Formats/JSONUtils.h | 2 + src/IO/PeekableWriteBuffer.cpp | 85 ++++ src/IO/PeekableWriteBuffer.h | 59 +++ src/Interpreters/executeQuery.cpp | 18 +- src/Interpreters/executeQuery.h | 5 +- src/Processors/Formats/IOutputFormat.h | 8 + .../Impl/JSONColumnsBlockOutputFormatBase.cpp | 3 +- .../Impl/JSONColumnsBlockOutputFormatBase.h | 1 + .../JSONCompactEachRowRowOutputFormat.cpp | 16 +- .../Impl/JSONCompactEachRowRowOutputFormat.h | 8 +- .../Impl/JSONEachRowRowOutputFormat.cpp | 18 +- .../Formats/Impl/JSONEachRowRowOutputFormat.h | 9 +- .../Impl/JSONObjectEachRowRowOutputFormat.cpp | 7 + .../Formats/Impl/JSONRowOutputFormat.cpp | 13 +- .../Formats/Impl/JSONRowOutputFormat.h | 5 +- .../Impl/ParallelFormattingOutputFormat.cpp | 48 +- .../Impl/ParallelFormattingOutputFormat.h | 27 ++ .../Formats/Impl/XMLRowOutputFormat.cpp | 13 +- .../Formats/Impl/XMLRowOutputFormat.h | 5 +- .../OutputFormatWithExceptionHandlerAdaptor.h | 75 +++ .../OutputFormatWithUTF8ValidationAdaptor.h | 32 +- ...wOutputFormatWithExceptionHandlerAdaptor.h | 104 +++++ src/Server/HTTPHandler.cpp | 80 ++-- src/Server/HTTPHandler.h | 2 + ...d_json_and_xml_on_http_exception.reference | 432 ++++++++++++++++++ ...41_valid_json_and_xml_on_http_exception.sh | 106 +++++ 32 files changed, 1138 insertions(+), 78 deletions(-) create mode 100644 src/IO/PeekableWriteBuffer.cpp create mode 100644 src/IO/PeekableWriteBuffer.h create mode 100644 src/Processors/Formats/OutputFormatWithExceptionHandlerAdaptor.h create mode 100644 src/Processors/Formats/RowOutputFormatWithExceptionHandlerAdaptor.h create mode 100644 tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.reference create mode 100755 tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.sh diff --git a/docs/en/interfaces/http.md b/docs/en/interfaces/http.md index 37821f0fee1..b28180fec67 100644 --- a/docs/en/interfaces/http.md +++ b/docs/en/interfaces/http.md @@ -697,3 +697,16 @@ $ curl -vv -H 'XXX:xxx' 'http://localhost:8123/get_relative_path_static_handler' Relative Path File * Connection #0 to host localhost left intact ``` + +## Valid JSON/XML response on exception during HTTP streaming {valid-output-on-exception-http-streaming} + +While query execution over HTTP an exception can happen when part of the data has already been sent. 
Usually an exception is sent to the client in plain text +even if some specific data format was used to output data and the output may become invalid in terms of specified data format. +To prevent it, you can use setting `http_write_exception_in_output_format` (enabled by default) that will tell ClickHouse to write an exception in specified format (currently supported for XML and JSON* formats). + +Examples: + +```bash + +``` + diff --git a/src/Core/Settings.h b/src/Core/Settings.h index c69d132ea25..b8ba6454f61 100644 --- a/src/Core/Settings.h +++ b/src/Core/Settings.h @@ -276,6 +276,7 @@ class IColumn; \ M(UInt64, http_headers_progress_interval_ms, 100, "Do not send HTTP headers X-ClickHouse-Progress more frequently than at each specified interval.", 0) \ M(Bool, http_wait_end_of_query, false, "Enable HTTP response buffering on the server-side.", 0) \ + M(Bool, http_write_exception_in_output_format, true, "Write exception in output format to produce valid output. Works with JSON and XML formats.", 0) \ M(UInt64, http_response_buffer_size, 0, "The number of bytes to buffer in the server memory before sending a HTTP response to the client or flushing to disk (when http_wait_end_of_query is enabled).", 0) \ \ M(Bool, fsync_metadata, true, "Do fsync after changing metadata for tables and databases (.sql files). Could be disabled in case of poor latency on server with high load of DDL queries and high load of disk subsystem.", 0) \ diff --git a/src/Core/SettingsChangesHistory.h b/src/Core/SettingsChangesHistory.h index 70b702f1b33..3172b246d68 100644 --- a/src/Core/SettingsChangesHistory.h +++ b/src/Core/SettingsChangesHistory.h @@ -80,6 +80,7 @@ namespace SettingsChangesHistory /// It's used to implement `compatibility` setting (see https://github.com/ClickHouse/ClickHouse/issues/35972) static std::map settings_changes_history = { + {"23.8", {{"http_write_exception_in_output_format", false, true, "Output valid JSON/XML on exception in HTTP streaming."}}}, {"23.7", {{"function_sleep_max_microseconds_per_block", 0, 3000000, "In previous versions, the maximum sleep time of 3 seconds was applied only for `sleep`, but not for `sleepEachRow` function. In the new version, we introduce this setting. If you set compatibility with the previous versions, we will disable the limit altogether."}}}, {"23.6", {{"http_send_timeout", 180, 30, "3 minutes seems crazy long. 
Note that this is timeout for a single network write call, not for the whole upload operation."}, {"http_receive_timeout", 180, 30, "See http_send_timeout."}}}, diff --git a/src/Formats/FormatFactory.cpp b/src/Formats/FormatFactory.cpp index 663b7f1ba95..4cd2ad5be03 100644 --- a/src/Formats/FormatFactory.cpp +++ b/src/Formats/FormatFactory.cpp @@ -1,7 +1,7 @@ #include #include -#include +//#include #include #include #include @@ -224,6 +224,12 @@ FormatSettings getFormatSettings(ContextPtr context, const Settings & settings) context->getRemoteHostFilter().checkURL(avro_schema_registry_url); } + if (context->getClientInfo().interface == ClientInfo::Interface::HTTP && context->getSettingsRef().http_write_exception_in_output_format.value) + { + format_settings.json.valid_output_on_exception = true; + format_settings.xml.valid_output_on_exception = true; + } + return format_settings; } diff --git a/src/Formats/FormatSettings.h b/src/Formats/FormatSettings.h index 3259c46e5ff..a2ef0b035e9 100644 --- a/src/Formats/FormatSettings.h +++ b/src/Formats/FormatSettings.h @@ -198,6 +198,7 @@ struct FormatSettings bool validate_types_from_metadata = true; bool validate_utf8 = false; bool allow_object_type = false; + bool valid_output_on_exception = false; } json; struct @@ -399,6 +400,11 @@ struct FormatSettings { bool allow_types_conversion = true; } native; + + struct + { + bool valid_output_on_exception = false; + } xml; }; } diff --git a/src/Formats/JSONUtils.cpp b/src/Formats/JSONUtils.cpp index 0aac72c68fe..aead2a3806a 100644 --- a/src/Formats/JSONUtils.cpp +++ b/src/Formats/JSONUtils.cpp @@ -451,6 +451,12 @@ namespace JSONUtils } } + void writeException(const String & exception_message, WriteBuffer & out, const FormatSettings & settings, size_t indent) + { + writeTitle("exception", out, indent, " "); + writeJSONString(exception_message, out, settings); + } + Strings makeNamesValidJSONStrings(const Strings & names, const FormatSettings & settings, bool validate_utf8) { Strings result; diff --git a/src/Formats/JSONUtils.h b/src/Formats/JSONUtils.h index fd1ba7db980..c023125ce66 100644 --- a/src/Formats/JSONUtils.h +++ b/src/Formats/JSONUtils.h @@ -105,6 +105,8 @@ namespace JSONUtils bool write_statistics, WriteBuffer & out); + void writeException(const String & exception_message, WriteBuffer & out, const FormatSettings & settings, size_t indent = 0); + void skipColon(ReadBuffer & in); void skipComma(ReadBuffer & in); diff --git a/src/IO/PeekableWriteBuffer.cpp b/src/IO/PeekableWriteBuffer.cpp new file mode 100644 index 00000000000..dc7f87dd539 --- /dev/null +++ b/src/IO/PeekableWriteBuffer.cpp @@ -0,0 +1,85 @@ +#include + +namespace DB +{ + +PeekableWriteBuffer::PeekableWriteBuffer(DB::WriteBuffer & sub_buf_) : BufferWithOwnMemory(0), sub_buf(sub_buf_) +{ + Buffer & sub_working = sub_buf.buffer(); + BufferBase::set(sub_working.begin(), sub_working.size(), sub_buf.offset()); +} + +void PeekableWriteBuffer::nextImpl() +{ + if (checkpoint) + { + if (write_to_own_memory) + { + size_t prev_size = position() - memory.data(); + size_t new_size = memory.size() * 2; + memory.resize(new_size); + BufferBase::set(memory.data(), memory.size(), prev_size); + return; + } + + if (memory.size() == 0) + memory.resize(DBMS_DEFAULT_BUFFER_SIZE); + + sub_buf.position() = position(); + BufferBase::set(memory.data(), memory.size(), 0); + write_to_own_memory = true; + return; + } + + sub_buf.position() = position(); + sub_buf.next(); + BufferBase::set(sub_buf.buffer().begin(), sub_buf.buffer().size(), sub_buf.offset()); +} 
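A minimal usage sketch of the checkpoint API introduced by this buffer (the helper function and the row string below are hypothetical; only the PeekableWriteBuffer methods are from this patch): set a checkpoint, write, then either drop the checkpoint on success or roll back on failure so no partial data reaches the wrapped buffer.

```cpp
#include <string>
#include <IO/PeekableWriteBuffer.h>

/// Hypothetical helper: writes one row so that either all of it or none of it
/// ends up in the underlying buffer.
void writeRowOrRollback(DB::PeekableWriteBuffer & buf, const std::string & row)
{
    buf.setCheckpoint();                        /// From here on, bytes are held in the buffer's own memory.
    try
    {
        buf.write(row.data(), row.size());      /// May throw half-way through the row.
        buf.dropCheckpoint();                   /// Success: forward the held bytes to the wrapped buffer.
    }
    catch (...)
    {
        buf.rollbackToCheckpoint(/*drop=*/ true);   /// Failure: discard everything written since the checkpoint.
        throw;
    }
}
```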
+ + +void PeekableWriteBuffer::dropCheckpoint() +{ + assert(checkpoint); + checkpoint = std::nullopt; + /// If we have saved data in own memory, write it to sub-buf. + if (write_to_own_memory) + { + try + { + sub_buf.next(); + sub_buf.write(memory.data(), position() - memory.data()); + Buffer & sub_working = sub_buf.buffer(); + BufferBase::set(sub_working.begin(), sub_working.size(), sub_buf.offset()); + write_to_own_memory = false; + } + catch (...) + { + /// If exception happened during writing to sub buffer, we should + /// update buffer to not leave it in invalid state. + Buffer & sub_working = sub_buf.buffer(); + BufferBase::set(sub_working.begin(), sub_working.size(), sub_buf.offset()); + write_to_own_memory = false; + } + } + +} + +void PeekableWriteBuffer::rollbackToCheckpoint(bool drop) +{ + assert(checkpoint); + + /// Just ignore all data written after checkpoint. + if (write_to_own_memory) + { + Buffer & sub_working = sub_buf.buffer(); + BufferBase::set(sub_working.begin(), sub_working.size(), sub_buf.offset()); + write_to_own_memory = false; + } + + position() = *checkpoint; + + if (drop) + checkpoint = std::nullopt; +} + +} diff --git a/src/IO/PeekableWriteBuffer.h b/src/IO/PeekableWriteBuffer.h new file mode 100644 index 00000000000..e7094f11fcb --- /dev/null +++ b/src/IO/PeekableWriteBuffer.h @@ -0,0 +1,59 @@ +#pragma once +#include +#include +#include + +namespace DB +{ + +namespace ErrorCodes +{ + extern const int LOGICAL_ERROR; +} + +/// Similar to PeekableReadBuffer. +/// Allows to set checkpoint at some position in stream and come back to this position later. +/// When next() is called, saves data between checkpoint and current position to own memory instead of writing it to sub-buffer. +/// So, all the data after checkpoint won't be written in sub-buffer until checkpoint is dropped. +/// Rollback to checkpoint means that all data after checkpoint will be ignored and not sent to sub-buffer. +/// Sub-buffer should not be accessed directly during the lifetime of peekable buffer (unless +/// you reset() the state of peekable buffer after each change of underlying buffer) +/// If position() of peekable buffer is explicitly set to some position before checkpoint +/// (e.g. by istr.position() = prev_pos), behavior is undefined. +class PeekableWriteBuffer : public BufferWithOwnMemory +{ + friend class PeekableWriteBufferCheckpoint; +public: + explicit PeekableWriteBuffer(WriteBuffer & sub_buf_); + + /// Sets checkpoint at current position + ALWAYS_INLINE inline void setCheckpoint() + { + if (checkpoint) + throw Exception(ErrorCodes::LOGICAL_ERROR, "PeekableWriteBuffer does not support recursive checkpoints."); + + checkpoint.emplace(pos); + } + + /// Forget checkpoint and send all data from checkpoint to position to sub-buffer. + void dropCheckpoint(); + + /// Sets position at checkpoint and forget all data written from checkpoint to position. 
+ /// All pointers (such as this->buffer().end()) may be invalidated + void rollbackToCheckpoint(bool drop = false); + + void finalizeImpl() override + { + assert(!checkpoint); + sub_buf.position() = position(); + } + +private: + void nextImpl() override; + + WriteBuffer & sub_buf; + bool write_to_own_memory = false; + std::optional checkpoint = std::nullopt; +}; + +} diff --git a/src/Interpreters/executeQuery.cpp b/src/Interpreters/executeQuery.cpp index 578ca3b41f9..651305d9c52 100644 --- a/src/Interpreters/executeQuery.cpp +++ b/src/Interpreters/executeQuery.cpp @@ -1250,7 +1250,8 @@ void executeQuery( bool allow_into_outfile, ContextMutablePtr context, SetResultDetailsFunc set_result_details, - const std::optional & output_format_settings) + const std::optional & output_format_settings, + HandleExceptionInOutputFormatFunc handle_exception_in_output_format) { PODArray parse_buf; const char * begin; @@ -1308,6 +1309,7 @@ void executeQuery( ASTPtr ast; BlockIO streams; + OutputFormatPtr output_format; std::tie(ast, streams) = executeQueryImpl(begin, end, context, false, QueryProcessingStage::Complete, &istr); auto & pipeline = streams.pipeline; @@ -1350,30 +1352,30 @@ void executeQuery( ? getIdentifierName(ast_query_with_output->format) : context->getDefaultFormat(); - auto out = FormatFactory::instance().getOutputFormatParallelIfPossible( + output_format = FormatFactory::instance().getOutputFormatParallelIfPossible( format_name, compressed_buffer ? *compressed_buffer : *out_buf, materializeBlock(pipeline.getHeader()), context, output_format_settings); - out->setAutoFlush(); + output_format->setAutoFlush(); /// Save previous progress callback if any. TODO Do it more conveniently. auto previous_progress_callback = context->getProgressCallback(); /// NOTE Progress callback takes shared ownership of 'out'. - pipeline.setProgressCallback([out, previous_progress_callback] (const Progress & progress) + pipeline.setProgressCallback([output_format, previous_progress_callback] (const Progress & progress) { if (previous_progress_callback) previous_progress_callback(progress); - out->onProgress(progress); + output_format->onProgress(progress); }); - result_details.content_type = out->getContentType(); + result_details.content_type = output_format->getContentType(); result_details.format = format_name; - pipeline.complete(std::move(out)); + pipeline.complete(output_format); } else { @@ -1403,6 +1405,8 @@ void executeQuery( } catch (...) { + if (handle_exception_in_output_format && output_format) + handle_exception_in_output_format(*output_format); streams.onException(); throw; } diff --git a/src/Interpreters/executeQuery.h b/src/Interpreters/executeQuery.h index f2a12bbef18..11ef17aaade 100644 --- a/src/Interpreters/executeQuery.h +++ b/src/Interpreters/executeQuery.h @@ -15,6 +15,7 @@ namespace DB class IInterpreter; class ReadBuffer; class WriteBuffer; +class IOutputFormat; struct QueryStatusInfo; struct QueryResultDetails @@ -26,6 +27,7 @@ struct QueryResultDetails }; using SetResultDetailsFunc = std::function; +using HandleExceptionInOutputFormatFunc = std::function; /// Parse and execute a query. void executeQuery( @@ -34,7 +36,8 @@ void executeQuery( bool allow_into_outfile, /// If true and the query contains INTO OUTFILE section, redirect output to that file. ContextMutablePtr context, /// DB, tables, data types, storage engines, functions, aggregate functions... 
SetResultDetailsFunc set_result_details, /// If a non-empty callback is passed, it will be called with the query id, the content-type, the format, and the timezone. - const std::optional & output_format_settings = std::nullopt /// Format settings for output format, will be calculated from the context if not set. + const std::optional & output_format_settings = std::nullopt, /// Format settings for output format, will be calculated from the context if not set. + HandleExceptionInOutputFormatFunc handle_exception_in_output_format = {} /// If a non-empty callback is passed, it will be called on exception with created output format. ); diff --git a/src/Processors/Formats/IOutputFormat.h b/src/Processors/Formats/IOutputFormat.h index 58700a978ff..cae2ab7691e 100644 --- a/src/Processors/Formats/IOutputFormat.h +++ b/src/Processors/Formats/IOutputFormat.h @@ -71,6 +71,9 @@ public: consumeExtremes(Chunk(extremes.getColumns(), extremes.rows())); } + virtual bool supportsWritingException() const { return false; } + virtual void setException(const String & /*exception_message*/) {} + size_t getResultRows() const { return result_rows; } size_t getResultBytes() const { return result_bytes; } @@ -162,6 +165,11 @@ protected: /// outputs them in finalize() method. virtual bool areTotalsAndExtremesUsedInFinalize() const { return false; } + /// Derived classes can use some wrappers around out WriteBuffer + /// and can override this method to return wrapper + /// that should be used in its derived classes. + virtual WriteBuffer * getWriteBufferPtr() { return &out; } + WriteBuffer & out; Chunk current_chunk; diff --git a/src/Processors/Formats/Impl/JSONColumnsBlockOutputFormatBase.cpp b/src/Processors/Formats/Impl/JSONColumnsBlockOutputFormatBase.cpp index 490516b7eb4..72a009c20bf 100644 --- a/src/Processors/Formats/Impl/JSONColumnsBlockOutputFormatBase.cpp +++ b/src/Processors/Formats/Impl/JSONColumnsBlockOutputFormatBase.cpp @@ -9,10 +9,11 @@ namespace DB JSONColumnsBlockOutputFormatBase::JSONColumnsBlockOutputFormatBase( WriteBuffer & out_, const Block & header_, const FormatSettings & format_settings_, bool validate_utf8) - : OutputFormatWithUTF8ValidationAdaptor(validate_utf8, header_, out_) + : OutputFormatWithUTF8ValidationAdaptor(header_, out_, validate_utf8) , format_settings(format_settings_) , serializations(header_.getSerializations()) { + ostr = OutputFormatWithUTF8ValidationAdaptor::getWriteBufferPtr(); } void JSONColumnsBlockOutputFormatBase::consume(Chunk chunk) diff --git a/src/Processors/Formats/Impl/JSONColumnsBlockOutputFormatBase.h b/src/Processors/Formats/Impl/JSONColumnsBlockOutputFormatBase.h index 235a6d4da96..d73ac53b97a 100644 --- a/src/Processors/Formats/Impl/JSONColumnsBlockOutputFormatBase.h +++ b/src/Processors/Formats/Impl/JSONColumnsBlockOutputFormatBase.h @@ -38,6 +38,7 @@ protected: Chunk mono_chunk; size_t written_rows = 0; + WriteBuffer * ostr; }; } diff --git a/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.cpp index 0cafc053467..c5c9af60982 100644 --- a/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.cpp @@ -15,12 +15,13 @@ JSONCompactEachRowRowOutputFormat::JSONCompactEachRowRowOutputFormat(WriteBuffer bool with_names_, bool with_types_, bool yield_strings_) - : RowOutputFormatWithUTF8ValidationAdaptor(settings_.json.validate_utf8, header_, out_) + : RowOutputFormatWithExceptionHandlerAdaptor(header_, 
out_, settings_.json.valid_output_on_exception, settings_.json.validate_utf8) , settings(settings_) , with_names(with_names_) , with_types(with_types_) , yield_strings(yield_strings_) { + ostr = RowOutputFormatWithExceptionHandlerAdaptor::getWriteBufferPtr(); } @@ -102,6 +103,19 @@ void JSONCompactEachRowRowOutputFormat::consumeTotals(DB::Chunk chunk) IRowOutputFormat::consumeTotals(std::move(chunk)); } +void JSONCompactEachRowRowOutputFormat::writeSuffix() +{ + if (!exception_message.empty()) + { + if (haveWrittenData()) + writeRowBetweenDelimiter(); + + writeRowStartDelimiter(); + writeJSONString(exception_message, *ostr, settings); + writeRowEndDelimiter(); + } +} + void registerOutputFormatJSONCompactEachRow(FormatFactory & factory) { for (bool yield_strings : {false, true}) diff --git a/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.h b/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.h index 2be39669dd2..a05fff699a5 100644 --- a/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.h +++ b/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.h @@ -3,15 +3,16 @@ #include #include #include +#include #include namespace DB { -/** The stream for outputting data in JSON format, by object per line. +/** The stream for outputting data in JSON format, by JSON array per line. */ -class JSONCompactEachRowRowOutputFormat final : public RowOutputFormatWithUTF8ValidationAdaptor +class JSONCompactEachRowRowOutputFormat final : public RowOutputFormatWithExceptionHandlerAdaptor { public: JSONCompactEachRowRowOutputFormat( @@ -33,6 +34,7 @@ private: void writeFieldDelimiter() override; void writeRowStartDelimiter() override; void writeRowEndDelimiter() override; + void writeSuffix() override; bool supportTotals() const override { return true; } void consumeTotals(Chunk) override; @@ -43,5 +45,7 @@ private: bool with_names; bool with_types; bool yield_strings; + + WriteBuffer * ostr; }; } diff --git a/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.cpp index 5b8f6cc1af7..2169d815fbf 100644 --- a/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.cpp @@ -3,6 +3,7 @@ #include #include #include +#include namespace DB @@ -14,10 +15,12 @@ JSONEachRowRowOutputFormat::JSONEachRowRowOutputFormat( const Block & header_, const FormatSettings & settings_, bool pretty_json_) - : RowOutputFormatWithUTF8ValidationAdaptor(settings_.json.validate_utf8, header_, out_), - pretty_json(pretty_json_), - settings(settings_) + : RowOutputFormatWithExceptionHandlerAdaptor( + header_, out_, settings_.json.valid_output_on_exception, settings_.json.validate_utf8) + , pretty_json(pretty_json_) + , settings(settings_) { + ostr = RowOutputFormatWithExceptionHandlerAdaptor::getWriteBufferPtr(); fields = JSONUtils::makeNamesValidJSONStrings(getPort(PortKind::Main).getHeader().getNames(), settings, settings.json.validate_utf8); } @@ -76,6 +79,15 @@ void JSONEachRowRowOutputFormat::writePrefix() void JSONEachRowRowOutputFormat::writeSuffix() { + if (!exception_message.empty()) + { + if (haveWrittenData()) + writeRowBetweenDelimiter(); + writeRowStartDelimiter(); + JSONUtils::writeException(exception_message, *ostr, settings, pretty_json ? 
1 : 0); + writeRowEndDelimiter(); + } + if (settings.json.array_of_rows) writeCString("\n]\n", *ostr); } diff --git a/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.h b/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.h index e05d189afe9..28bfbf2e6ac 100644 --- a/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.h +++ b/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.h @@ -2,7 +2,9 @@ #include #include +#include #include +#include #include @@ -11,7 +13,7 @@ namespace DB /** The stream for outputting data in JSON format, by object per line. */ -class JSONEachRowRowOutputFormat : public RowOutputFormatWithUTF8ValidationAdaptor +class JSONEachRowRowOutputFormat : public RowOutputFormatWithExceptionHandlerAdaptor { public: JSONEachRowRowOutputFormat( @@ -40,10 +42,11 @@ protected: size_t field_number = 0; bool pretty_json; + FormatSettings settings; + WriteBuffer * ostr; + private: Names fields; - - FormatSettings settings; }; } diff --git a/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp index a02199d6075..8f4d11a604a 100644 --- a/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp @@ -62,6 +62,13 @@ void JSONObjectEachRowRowOutputFormat::writeRowBetweenDelimiter() void JSONObjectEachRowRowOutputFormat::writeSuffix() { + if (!exception_message.empty()) + { + if (haveWrittenData()) + writeRowBetweenDelimiter(); + JSONUtils::writeException(exception_message, *ostr, settings, 1); + } + JSONUtils::writeObjectEnd(*ostr); writeChar('\n', *ostr); } diff --git a/src/Processors/Formats/Impl/JSONRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONRowOutputFormat.cpp index 0193ec7e3d3..e4c4e2a3bc6 100644 --- a/src/Processors/Formats/Impl/JSONRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONRowOutputFormat.cpp @@ -13,9 +13,10 @@ JSONRowOutputFormat::JSONRowOutputFormat( const Block & header, const FormatSettings & settings_, bool yield_strings_) - : RowOutputFormatWithUTF8ValidationAdaptor(true, header, out_), settings(settings_), yield_strings(yield_strings_) + : RowOutputFormatWithExceptionHandlerAdaptor(header, out_, settings_.json.valid_output_on_exception, true), settings(settings_), yield_strings(yield_strings_) { names = JSONUtils::makeNamesValidJSONStrings(header.getNames(), settings, true); + ostr = RowOutputFormatWithExceptionHandlerAdaptor::getWriteBufferPtr(); } @@ -117,9 +118,15 @@ void JSONRowOutputFormat::finalizeImpl() statistics.applied_limit, statistics.watch, statistics.progress, - settings.write_statistics, + settings.write_statistics && exception_message.empty(), *ostr); + if (!exception_message.empty()) + { + writeCString(",\n\n", *ostr); + JSONUtils::writeException(exception_message, *ostr, settings, 1); + } + JSONUtils::writeObjectEnd(*ostr); writeChar('\n', *ostr); ostr->next(); @@ -127,7 +134,7 @@ void JSONRowOutputFormat::finalizeImpl() void JSONRowOutputFormat::resetFormatterImpl() { - RowOutputFormatWithUTF8ValidationAdaptor::resetFormatterImpl(); + RowOutputFormatWithExceptionHandlerAdaptor::resetFormatterImpl(); row_count = 0; statistics = Statistics(); } diff --git a/src/Processors/Formats/Impl/JSONRowOutputFormat.h b/src/Processors/Formats/Impl/JSONRowOutputFormat.h index dc3f0541af0..a38cd0e8db9 100644 --- a/src/Processors/Formats/Impl/JSONRowOutputFormat.h +++ b/src/Processors/Formats/Impl/JSONRowOutputFormat.h @@ -3,8 +3,10 @@ #include #include #include +#include 
#include #include +#include #include @@ -13,7 +15,7 @@ namespace DB /** Stream for output data in JSON format. */ -class JSONRowOutputFormat : public RowOutputFormatWithUTF8ValidationAdaptor +class JSONRowOutputFormat : public RowOutputFormatWithExceptionHandlerAdaptor { public: JSONRowOutputFormat( @@ -69,6 +71,7 @@ protected: FormatSettings settings; bool yield_strings; + WriteBuffer * ostr; }; } diff --git a/src/Processors/Formats/Impl/ParallelFormattingOutputFormat.cpp b/src/Processors/Formats/Impl/ParallelFormattingOutputFormat.cpp index 46fe2ba26a8..3e63e2abd6c 100644 --- a/src/Processors/Formats/Impl/ParallelFormattingOutputFormat.cpp +++ b/src/Processors/Formats/Impl/ParallelFormattingOutputFormat.cpp @@ -8,7 +8,6 @@ namespace DB void ParallelFormattingOutputFormat::finalizeImpl() { need_flush = true; - IOutputFormat::finalized = true; /// Don't throw any background_exception here, because we want to finalize the execution. /// Exception will be checked after main thread is finished. addChunk(Chunk{}, ProcessingUnitType::FINALIZE, /*can_throw_exception*/ false); @@ -24,8 +23,29 @@ namespace DB std::lock_guard lock(mutex); if (background_exception) - std::rethrow_exception(background_exception); + { + collector_finished.set(); + rethrowBackgroundException(); + } } + + if (collected_prefix && collected_suffix && collected_finalize) + return; + + auto formatter = internal_formatter_creator(out); + formatter->setRowsReadBefore(rows_collected); + formatter->setException(exception_message); + + if (!collected_prefix) + formatter->writePrefix(); + + if (!collected_suffix) + formatter->writeSuffix(); + + if (!collected_finalize) + formatter->finalizeImpl(); + + formatter->finalizeBuffers(); } void ParallelFormattingOutputFormat::addChunk(Chunk chunk, ProcessingUnitType type, bool can_throw_exception) @@ -33,7 +53,7 @@ namespace DB { std::lock_guard lock(mutex); if (background_exception && can_throw_exception) - std::rethrow_exception(background_exception); + rethrowBackgroundException(); } const auto current_unit_number = writer_unit_number % processing_units.size(); @@ -62,7 +82,10 @@ namespace DB size_t first_row_num = rows_consumed; if (unit.type == ProcessingUnitType::PLAIN) + { rows_consumed += unit.chunk.getNumRows(); + unit.rows_num = unit.chunk.getNumRows(); + } scheduleFormatterThreadForUnitWithNumber(current_unit_number, first_row_num); ++writer_unit_number; @@ -125,7 +148,7 @@ namespace DB assert(unit.status == READY_TO_READ); /// Use this copy to after notification to stop the execution. - auto copy_if_unit_type = unit.type; + auto copy_of_unit_type = unit.type; /// Do main work here. out.write(unit.segment.data(), unit.actual_memory_size); @@ -134,6 +157,7 @@ namespace DB IOutputFormat::flush(); ++collector_unit_number; + rows_collected += unit.rows_num; { /// Notify other threads. @@ -141,9 +165,19 @@ namespace DB unit.status = READY_TO_INSERT; writer_condvar.notify_all(); } - /// We can exit only after writing last piece of to out buffer. - if (copy_if_unit_type == ProcessingUnitType::FINALIZE) + + if (copy_of_unit_type == ProcessingUnitType::START) { + collected_prefix = true; + } + else if (copy_of_unit_type == ProcessingUnitType::PLAIN_FINISH) + { + collected_suffix = true; + } + /// We can exit only after writing last piece of data to out buffer. 
+ else if (copy_of_unit_type == ProcessingUnitType::FINALIZE) + { + collected_finalize = true; break; } } @@ -156,7 +190,6 @@ namespace DB } } - void ParallelFormattingOutputFormat::formatterThreadFunction(size_t current_unit_number, size_t first_row_num, const ThreadGroupPtr & thread_group) { SCOPE_EXIT_SAFE( @@ -184,6 +217,7 @@ namespace DB auto formatter = internal_formatter_creator(out_buffer); formatter->setRowsReadBefore(first_row_num); + formatter->setException(exception_message); switch (unit.type) { diff --git a/src/Processors/Formats/Impl/ParallelFormattingOutputFormat.h b/src/Processors/Formats/Impl/ParallelFormattingOutputFormat.h index 490f033b87e..b9a3b7638fa 100644 --- a/src/Processors/Formats/Impl/ParallelFormattingOutputFormat.h +++ b/src/Processors/Formats/Impl/ParallelFormattingOutputFormat.h @@ -142,6 +142,14 @@ public: return internal_formatter_creator(buffer)->getContentType(); } + bool supportsWritingException() const override + { + WriteBufferFromOwnString buffer; + return internal_formatter_creator(buffer)->supportsWritingException(); + } + + void setException(const String & exception_message_) override { exception_message = exception_message_; } + private: void consume(Chunk chunk) override final { @@ -214,6 +222,7 @@ private: Memory<> segment; size_t actual_memory_size{0}; Statistics statistics; + size_t rows_num; }; Poco::Event collector_finished{}; @@ -241,12 +250,19 @@ private: std::condition_variable writer_condvar; size_t rows_consumed = 0; + size_t rows_collected = 0; std::atomic_bool are_totals_written = false; /// We change statistics in onProgress() which can be called from different threads. std::mutex statistics_mutex; bool save_totals_and_extremes_in_statistics; + String exception_message; + bool exception_is_rethrown = false; + bool collected_prefix = false; + bool collected_suffix = false; + bool collected_finalize = false; + void finishAndWait(); void onBackgroundException() @@ -261,6 +277,17 @@ private: collector_condvar.notify_all(); } + void rethrowBackgroundException() + { + /// Rethrow background exception only once, because + /// OutputFormat can be used after it to write an exception. 
+ if (!exception_is_rethrown) + { + exception_is_rethrown = true; + std::rethrow_exception(background_exception); + } + } + void scheduleFormatterThreadForUnitWithNumber(size_t ticket_number, size_t first_row_num) { pool.scheduleOrThrowOnError([this, thread_group = CurrentThread::getGroup(), ticket_number, first_row_num] diff --git a/src/Processors/Formats/Impl/XMLRowOutputFormat.cpp b/src/Processors/Formats/Impl/XMLRowOutputFormat.cpp index 1d6fb62275c..eb735cc93aa 100644 --- a/src/Processors/Formats/Impl/XMLRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/XMLRowOutputFormat.cpp @@ -8,8 +8,9 @@ namespace DB { XMLRowOutputFormat::XMLRowOutputFormat(WriteBuffer & out_, const Block & header_, const FormatSettings & format_settings_) - : RowOutputFormatWithUTF8ValidationAdaptor(true, header_, out_), fields(header_.getNamesAndTypes()), format_settings(format_settings_) + : RowOutputFormatWithExceptionHandlerAdaptor(header_, out_, true, format_settings_.xml.valid_output_on_exception), fields(header_.getNamesAndTypes()), format_settings(format_settings_) { + ostr = RowOutputFormatWithExceptionHandlerAdaptor::getWriteBufferPtr(); const auto & sample = getPort(PortKind::Main).getHeader(); field_tag_names.resize(sample.columns()); @@ -191,7 +192,9 @@ void XMLRowOutputFormat::finalizeImpl() writeRowsBeforeLimitAtLeast(); - if (format_settings.write_statistics) + if (!exception_message.empty()) + writeException(); + else if (format_settings.write_statistics) writeStatistics(); writeCString("\n", *ostr); @@ -230,6 +233,12 @@ void XMLRowOutputFormat::writeStatistics() writeCString("\t\n", *ostr); } +void XMLRowOutputFormat::writeException() +{ + writeCString("\t", *ostr); + writeXMLStringForTextElement(exception_message, *ostr); + writeCString("\n", *ostr); +} void registerOutputFormatXML(FormatFactory & factory) { diff --git a/src/Processors/Formats/Impl/XMLRowOutputFormat.h b/src/Processors/Formats/Impl/XMLRowOutputFormat.h index e25e7129109..daf03539d0b 100644 --- a/src/Processors/Formats/Impl/XMLRowOutputFormat.h +++ b/src/Processors/Formats/Impl/XMLRowOutputFormat.h @@ -6,6 +6,7 @@ #include #include #include +#include namespace DB @@ -13,7 +14,7 @@ namespace DB /** A stream for outputting data in XML format. */ -class XMLRowOutputFormat final : public RowOutputFormatWithUTF8ValidationAdaptor +class XMLRowOutputFormat final : public RowOutputFormatWithExceptionHandlerAdaptor { public: XMLRowOutputFormat(WriteBuffer & out_, const Block & header_, const FormatSettings & format_settings_); @@ -56,6 +57,7 @@ private: void writeExtremesElement(const char * title, const Columns & columns, size_t row_num); void writeRowsBeforeLimitAtLeast(); void writeStatistics(); + void writeException(); size_t field_number = 0; size_t row_count = 0; @@ -63,6 +65,7 @@ private: Names field_tag_names; const FormatSettings format_settings; + WriteBuffer * ostr; }; } diff --git a/src/Processors/Formats/OutputFormatWithExceptionHandlerAdaptor.h b/src/Processors/Formats/OutputFormatWithExceptionHandlerAdaptor.h new file mode 100644 index 00000000000..bb318dae81e --- /dev/null +++ b/src/Processors/Formats/OutputFormatWithExceptionHandlerAdaptor.h @@ -0,0 +1,75 @@ +#pragma once + +#include +#include + +#include +#include + +namespace DB +{ + +template +class RowOutputFormatWithExceptionHandlerAdaptorBase : public Base +{ +public: + RowOutputFormatWithExceptionHandlerAdaptorBase(bool handle_exceptions, const Block & header, WriteBuffer & out_, Args... args) + : Base(header, out_, std::forward(args)...) 
+ { + if (handle_exceptions) + peekable_out = std::make_unique(*Base::getWriteBufferPtr()); + } + + void write(const Columns & columns, size_t row_num) + { + if (!peekable_out) + Base::write(columns, row_num); + + + PeekableWriteBufferCheckpoint checkpoint(*peekable_out); + try + { + Base::write(columns, row_num); + } + catch (...) + { + peekable_out->rollbackToCheckpoint(); + throw; + } + } + + void flush() override + { + getWriteBufferPtr()->next(); + + if (peekable_out) + Base::getWriteBufferPtr()->next(); + } + + void finalizeBuffers() override + { + if (peekable_out) + peekable_out->finalize(); + } + + void resetFormatterImpl() override + { + peekable_out = std::make_unique(*Base::getWriteBufferPtr()); + } + +protected: + /// Returns buffer that should be used in derived classes instead of out. + WriteBuffer * getWriteBufferPtr() override + { + if (peekable_out) + peekable_out.get(); + return Base::getWriteBufferPtr(); + } + +private: + + std::unique_ptr peekable_out; +}; + +} + diff --git a/src/Processors/Formats/OutputFormatWithUTF8ValidationAdaptor.h b/src/Processors/Formats/OutputFormatWithUTF8ValidationAdaptor.h index 8d8fb9ef0c6..f86ff278b33 100644 --- a/src/Processors/Formats/OutputFormatWithUTF8ValidationAdaptor.h +++ b/src/Processors/Formats/OutputFormatWithUTF8ValidationAdaptor.h @@ -9,12 +9,12 @@ namespace DB { -template +template class OutputFormatWithUTF8ValidationAdaptorBase : public Base { public: - OutputFormatWithUTF8ValidationAdaptorBase(bool validate_utf8, const Block & header, WriteBuffer & out_, Args... args) - : Base(header, out_, std::forward(args)...) + OutputFormatWithUTF8ValidationAdaptorBase(const Block & header, WriteBuffer & out_, bool validate_utf8) + : Base(header, out_) { bool values_can_contain_invalid_utf8 = false; for (const auto & type : this->getPort(IOutputFormat::PortKind::Main).getHeader().getDataTypes()) @@ -24,37 +24,37 @@ public: } if (validate_utf8 && values_can_contain_invalid_utf8) - { - validating_ostr = std::make_unique(this->out); - ostr = validating_ostr.get(); - } - else - ostr = &this->out; + validating_ostr = std::make_unique(*Base::getWriteBufferPtr()); } void flush() override { - ostr->next(); - if (validating_ostr) - this->out.next(); + validating_ostr->next(); + Base::flush(); } void finalizeBuffers() override { if (validating_ostr) validating_ostr->finalize(); + Base::finalizeBuffers(); } void resetFormatterImpl() override { - validating_ostr = std::make_unique(this->out); - ostr = validating_ostr.get(); + Base::resetFormatterImpl(); + validating_ostr = std::make_unique(*Base::getWriteBufferPtr()); } protected: - /// Point to validating_ostr or out from IOutputFormat, should be used in derived classes instead of out. - WriteBuffer * ostr; + /// Returns buffer that should be used in derived classes instead of out. + WriteBuffer * getWriteBufferPtr() override + { + if (validating_ostr) + return validating_ostr.get(); + return Base::getWriteBufferPtr(); + } private: /// Validates UTF-8 sequences, replaces bad sequences with replacement character. 
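Editor's note: the adaptors above and the RowOutputFormatWithExceptionHandlerAdaptor introduced in the next diff all rely on the same idea — stage each row in a peekable buffer, set a checkpoint before writing the row (and its row-between delimiter), and roll back to that checkpoint if formatting throws, so everything already committed to the underlying stream stays well-formed and an exception object can still be appended afterwards. The sketch below is a minimal, self-contained illustration of that checkpoint/rollback pattern only; it is not ClickHouse's PeekableWriteBuffer API, and the CheckpointedWriter class and its method names are invented for this example.

```cpp
#include <iostream>
#include <stdexcept>
#include <string>
#include <vector>

/// Toy stand-in for a peekable write buffer: output is staged in memory so a
/// partially formatted row can be discarded before anything reaches the sink.
class CheckpointedWriter
{
public:
    explicit CheckpointedWriter(std::ostream & sink_) : sink(sink_) {}

    void write(const std::string & s) { staged += s; }
    void setCheckpoint() { checkpoint = staged.size(); }
    void rollbackToCheckpoint() { staged.resize(checkpoint); }
    void finalize() { sink << staged; staged.clear(); checkpoint = 0; }

private:
    std::ostream & sink;
    std::string staged;
    size_t checkpoint = 0;
};

int main()
{
    CheckpointedWriter out(std::cout);
    std::vector<int> rows{1, 2, -1, 3};  /// -1 stands for a value that fails to format

    try
    {
        for (int value : rows)
        {
            out.setCheckpoint();  /// checkpoint before the row, as in consume()
            try
            {
                out.write("{\"value\": ");
                if (value < 0)
                    throw std::runtime_error("cannot format value");
                out.write(std::to_string(value) + "}\n");
            }
            catch (...)
            {
                out.rollbackToCheckpoint();  /// drop the half-written row
                throw;
            }
        }
    }
    catch (const std::exception & e)
    {
        /// Only complete rows survive; the error is appended as its own object.
        out.write(std::string("{\"exception\": \"") + e.what() + "\"}\n");
    }

    out.finalize();
}
```

The same structure appears in the adaptor's consume(): set a checkpoint, write the row, drop the checkpoint on success, and roll back and rethrow on failure, which is what keeps the JSON and XML output parseable when an exception is written into it.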
diff --git a/src/Processors/Formats/RowOutputFormatWithExceptionHandlerAdaptor.h b/src/Processors/Formats/RowOutputFormatWithExceptionHandlerAdaptor.h new file mode 100644 index 00000000000..4e797c521c0 --- /dev/null +++ b/src/Processors/Formats/RowOutputFormatWithExceptionHandlerAdaptor.h @@ -0,0 +1,104 @@ +#pragma once + +#include +#include +#include + +#include +#include +#include + +namespace DB +{ + +template +class RowOutputFormatWithExceptionHandlerAdaptor : public Base +{ +public: + RowOutputFormatWithExceptionHandlerAdaptor(const Block & header, WriteBuffer & out_, bool handle_exceptions, Args... args) + : Base(header, out_, std::forward(args)...) + { + if (handle_exceptions) + peekable_out = std::make_unique(*Base::getWriteBufferPtr()); + } + + void consume(DB::Chunk chunk) override + { + if (!peekable_out) + { + Base::consume(std::move(chunk)); + return; + } + + auto num_rows = chunk.getNumRows(); + const auto & columns = chunk.getColumns(); + + for (size_t row = 0; row < num_rows; ++row) + { + /// It's important to set a checkpoint before writing row-between delimiter + peekable_out->setCheckpoint(); + + if (Base::haveWrittenData()) + writeRowBetweenDelimiter(); + + try + { + write(columns, row); + } + catch (...) + { + peekable_out->rollbackToCheckpoint(/*drop=*/true); + throw; + } + peekable_out->dropCheckpoint(); + + Base::first_row = false; + } + } + + void write(const Columns & columns, size_t row_num) override { Base::write(columns, row_num); } + void writeRowBetweenDelimiter() override { Base::writeRowBetweenDelimiter(); } + + void flush() override + { + if (peekable_out) + peekable_out->next(); + + Base::flush(); + } + + void finalizeBuffers() override + { + if (peekable_out) + peekable_out->finalize(); + Base::finalizeBuffers(); + } + + void resetFormatterImpl() override + { + Base::resetFormatterImpl(); + peekable_out = std::make_unique(*Base::getWriteBufferPtr()); + } + + bool supportsWritingException() const override { return true; } + + void setException(const String & exception_message_) override { exception_message = exception_message_; } + +protected: + /// Returns buffer that should be used in derived classes instead of out. + WriteBuffer * getWriteBufferPtr() override + { + if (peekable_out) + return peekable_out.get(); + return Base::getWriteBufferPtr(); + } + + String exception_message; + +private: + + std::unique_ptr peekable_out; +}; + +} + diff --git a/src/Server/HTTPHandler.cpp b/src/Server/HTTPHandler.cpp index a0bfcd49dfd..a5102ea9383 100644 --- a/src/Server/HTTPHandler.cpp +++ b/src/Server/HTTPHandler.cpp @@ -28,6 +28,8 @@ #include #include #include +#include +#include #include #include @@ -835,23 +837,40 @@ void HTTPHandler::processQuery( customizeContext(request, context, *in_post_maybe_compressed); in = has_external_data ? 
std::move(in_param) : std::make_unique(*in_param, *in_post_maybe_compressed); - executeQuery(*in, *used_output.out_maybe_delayed_and_compressed, /* allow_into_outfile = */ false, context, - [&response, this] (const QueryResultDetails & details) + auto set_query_result = [&response, this] (const QueryResultDetails & details) + { + response.add("X-ClickHouse-Query-Id", details.query_id); + + if (content_type_override) + response.setContentType(*content_type_override); + else if (details.content_type) + response.setContentType(*details.content_type); + + if (details.format) + response.add("X-ClickHouse-Format", *details.format); + + if (details.timezone) + response.add("X-ClickHouse-Timezone", *details.timezone); + }; + + auto handle_exception_in_output_format = [&](IOutputFormat & output_format) + { + if (settings.http_write_exception_in_output_format && output_format.supportsWritingException()) { - response.add("X-ClickHouse-Query-Id", details.query_id); - - if (content_type_override) - response.setContentType(*content_type_override); - else if (details.content_type) - response.setContentType(*details.content_type); - - if (details.format) - response.add("X-ClickHouse-Format", *details.format); - - if (details.timezone) - response.add("X-ClickHouse-Timezone", *details.timezone); + output_format.setException(getCurrentExceptionMessage(false)); + output_format.finalize(); + used_output.exception_is_written = true; } - ); + }; + + executeQuery( + *in, + *used_output.out_maybe_delayed_and_compressed, + /* allow_into_outfile = */ false, + context, + set_query_result, + {}, + handle_exception_in_output_format); if (used_output.hasDelayed()) { @@ -895,7 +914,7 @@ try response.setStatusAndReason(exceptionCodeToHTTPStatus(exception_code)); } - if (!response.sent() && !used_output.out_maybe_compressed) + if (!response.sent() && !used_output.out_maybe_compressed && !used_output.exception_is_written) { /// If nothing was sent yet and we don't even know if we must compress the response. *response.send() << s << std::endl; @@ -911,21 +930,24 @@ try used_output.out_maybe_delayed_and_compressed.reset(); } - /// Send the error message into already used (and possibly compressed) stream. - /// Note that the error message will possibly be sent after some data. - /// Also HTTP code 200 could have already been sent. - - /// If buffer has data, and that data wasn't sent yet, then no need to send that data - bool data_sent = used_output.out->count() != used_output.out->offset(); - - if (!data_sent) + if (!used_output.exception_is_written) { - used_output.out_maybe_compressed->position() = used_output.out_maybe_compressed->buffer().begin(); - used_output.out->position() = used_output.out->buffer().begin(); - } + /// Send the error message into already used (and possibly compressed) stream. + /// Note that the error message will possibly be sent after some data. + /// Also HTTP code 200 could have already been sent. 
- writeString(s, *used_output.out_maybe_compressed); - writeChar('\n', *used_output.out_maybe_compressed); + /// If buffer has data, and that data wasn't sent yet, then no need to send that data + bool data_sent = used_output.out->count() != used_output.out->offset(); + + if (!data_sent) + { + used_output.out_maybe_compressed->position() = used_output.out_maybe_compressed->buffer().begin(); + used_output.out->position() = used_output.out->buffer().begin(); + } + + writeString(s, *used_output.out_maybe_compressed); + writeChar('\n', *used_output.out_maybe_compressed); + } used_output.out_maybe_compressed->next(); } diff --git a/src/Server/HTTPHandler.h b/src/Server/HTTPHandler.h index 5eda5927538..94b5a44f105 100644 --- a/src/Server/HTTPHandler.h +++ b/src/Server/HTTPHandler.h @@ -62,6 +62,8 @@ private: bool finalized = false; + bool exception_is_written = false; + inline bool hasDelayed() const { return out_maybe_delayed_and_compressed != out_maybe_compressed; diff --git a/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.reference b/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.reference new file mode 100644 index 00000000000..452aa9d5022 --- /dev/null +++ b/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.reference @@ -0,0 +1,432 @@ +One block +Parallel formatting: 0 +JSON +{ + "meta": + [ + { + "name": "number", + "type": "UInt64" + }, + { + "name": "res", + "type": "UInt8" + } + ], + + "data": + [ + + ], + + "rows": 0, + + "exception": "Code: 395. : Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) " +} +JSONEachRow +{"exception": "Code: 395. : Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) "} +JSONCompact +{ + "meta": + [ + { + "name": "number", + "type": "UInt64" + }, + { + "name": "res", + "type": "UInt8" + } + ], + + "data": + [ + + ], + + "rows": 0, + + "exception": "Code: 395. : Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) " +} +JSONCompactEachRow +["Code: 395. : Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) "] +JSONObjectEachRow +{ + "exception": "Code: 395. : Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) " +} +XML + + + + + + number + UInt64 + + + res + UInt8 + + + + + + 0 + Code: 395. : Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) + +Parallel formatting: 1 +JSON +{ + "meta": + [ + { + "name": "number", + "type": "UInt64" + }, + { + "name": "res", + "type": "UInt8" + } + ], + + "data": + [ + + ], + + "rows": 0, + + "exception": "Code: 395. : Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) " +} +JSONEachRow +{"exception": "Code: 395. 
: Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) "} +JSONCompact +{ + "meta": + [ + { + "name": "number", + "type": "UInt64" + }, + { + "name": "res", + "type": "UInt8" + } + ], + + "data": + [ + + ], + + "rows": 0, + + "exception": "Code: 395. : Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) " +} +JSONCompactEachRow +["Code: 395. : Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) "] +JSONObjectEachRow +{ + "exception": "Code: 395. : Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) " +} +XML + + + + + + number + UInt64 + + + res + UInt8 + + + + + + 0 + Code: 395. : Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) + +Several blocks +Without parallel formatting +JSON +{ + "meta": + [ + { + "name": "number", + "type": "UInt64" + }, + { + "name": "res", + "type": "UInt8" + } + ], + + "data": + [ + { + "number": "0", + "res": 0 + }, + { + "number": "1", + "res": 0 + }, + { + "number": "2", + "res": 0 + }, + { + "number": "3", + "res": 0 + } + ], + + "rows": 4, + + "exception": "Code: 395. : Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) " +} +JSONEachRow +{"number":"0","res":0} +{"number":"1","res":0} +{"number":"2","res":0} +{"number":"3","res":0} +{"exception": "Code: 395. : Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) "} +JSONCompact +{ + "meta": + [ + { + "name": "number", + "type": "UInt64" + }, + { + "name": "res", + "type": "UInt8" + } + ], + + "data": + [ + ["0", 0], + ["1", 0], + ["2", 0], + ["3", 0] + ], + + "rows": 4, + + "exception": "Code: 395. : Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) " +} +JSONCompactEachRow +["0", 0] +["1", 0] +["2", 0] +["3", 0] +["Code: 395. : Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) "] +JSONObjectEachRow +{ + "row_1": {"number":"0","res":0}, + "row_1": {"number":"1","res":0}, + "row_1": {"number":"2","res":0}, + "row_1": {"number":"3","res":0}, + "exception": "Code: 395. : Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) " +} +XML + + + + + + number + UInt64 + + + res + UInt8 + + + + + + 0 + 0 + + + 1 + 0 + + + 2 + 0 + + + 3 + 0 + + + 4 + Code: 395. 
: Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) + +With parallel formatting +JSON +1 +JSONCompact +1 +JSONObjectEachRow +1 +JSONEachRow +1 +JSONCompactEachRow +1 +Formatting error +Without parallel formatting +JSON +{ + "meta": + [ + { + "name": "x", + "type": "UInt32" + }, + { + "name": "s", + "type": "String" + }, + { + "name": "y", + "type": "Enum8('a' = 1)" + } + ], + + "data": + [ + { + "x": 1, + "s": "str1", + "y": "a" + }, + { + "x": 2, + "s": "str2", + "y": "a" + }, + { + "x": 3, + "s": "str3", + "y": "a" + } + ], + + "rows": 3, + + "exception": "Code: 36. : Unexpected value 99 in enum: While executing JSONRowOutputFormat. (BAD_ARGUMENTS) " +} +JSONEachRow +{"x":1,"s":"str1","y":"a"} +{"x":2,"s":"str2","y":"a"} +{"x":3,"s":"str3","y":"a"} +{"exception": "Code: 36. : Unexpected value 99 in enum: While executing JSONEachRowRowOutputFormat. (BAD_ARGUMENTS) "} +JSONCompact +{ + "meta": + [ + { + "name": "x", + "type": "UInt32" + }, + { + "name": "s", + "type": "String" + }, + { + "name": "y", + "type": "Enum8('a' = 1)" + } + ], + + "data": + [ + [1, "str1", "a"], + [2, "str2", "a"], + [3, "str3", "a"] + ], + + "rows": 3, + + "exception": "Code: 36. : Unexpected value 99 in enum: While executing JSONCompactRowOutputFormat. (BAD_ARGUMENTS) " +} +JSONCompactEachRow +[1, "str1", "a"] +[2, "str2", "a"] +[3, "str3", "a"] +["Code: 36. : Unexpected value 99 in enum: While executing JSONCompactEachRowRowOutputFormat. (BAD_ARGUMENTS) "] +JSONObjectEachRow +{ + "row_1": {"x":1,"s":"str1","y":"a"}, + "row_1": {"x":2,"s":"str2","y":"a"}, + "row_1": {"x":3,"s":"str3","y":"a"}, + "exception": "Code: 36. : Unexpected value 99 in enum: While executing JSONObjectEachRowRowOutputFormat. (BAD_ARGUMENTS) " +} +XML + + + + + + x + UInt32 + + + s + String + + + y + Enum8('a' = 1) + + + + + + 1 + str1 + a + + + 2 + str2 + a + + + 3 + str3 + a + + + 3 + Code: 36. : Unexpected value 99 in enum: While executing XMLRowOutputFormat. (BAD_ARGUMENTS) + +With parallel formatting +JSON +1 +JSONCompact +1 +JSONObjectEachRow +1 +JSONEachRow +1 +JSONCompactEachRow +1 +Test 1 +1 +1 +Test 2 +1 +1 +Test 3 +1 +1 diff --git a/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.sh b/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.sh new file mode 100755 index 00000000000..cb4d1b6aee1 --- /dev/null +++ b/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.sh @@ -0,0 +1,106 @@ +#!/usr/bin/env bash + +CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# shellcheck source=../shell_config.sh +. 
"$CUR_DIR"/../shell_config.sh + +echo "One block" +for parallel in 0 1 +do + echo "Parallel formatting: $parallel" + for format in JSON JSONEachRow JSONCompact JSONCompactEachRow JSONObjectEachRow XML + do + echo $format + ${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select number, throwIf(number > 3) as res from numbers(10) format $format settings output_format_parallel_formatting=$parallel" | sed "s/(version .*)//" | sed "s/DB::Exception//" + done +done + +echo "Several blocks" +echo "Without parallel formatting" +for format in JSON JSONEachRow JSONCompact JSONCompactEachRow JSONObjectEachRow XML +do + echo $format + ${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select number, throwIf(number > 3) as res from system.numbers format $format settings max_block_size=1, output_format_parallel_formatting=0" | sed "s/(version .*)//" | sed "s/DB::Exception//" +done + +echo "With parallel formatting" +for format in JSON JSONCompact JSONObjectEachRow +do + echo $format + ${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select number, throwIf(number > 3) as res from system.numbers format $format settings max_block_size=1, output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" +done + +for format in JSONEachRow JSONCompactEachRow +do + echo $format + ${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select number, throwIf(number > 3) as res from system.numbers format $format settings max_block_size=1, output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=LineAsString -q "select min(isValidJSON(line)) from table" +done + +echo "Formatting error" +$CLICKHOUSE_CLIENT -q "drop table if exists test_02841" +$CLICKHOUSE_CLIENT -q "create table test_02841 (x UInt32, s String, y Enum('a' = 1)) engine=MergeTree order by x" +$CLICKHOUSE_CLIENT -q "system stop merges test_02841" +$CLICKHOUSE_CLIENT -q "insert into test_02841 values (1, 'str1', 1)" +$CLICKHOUSE_CLIENT -q "insert into test_02841 values (2, 'str2', 1)" +$CLICKHOUSE_CLIENT -q "insert into test_02841 values (3, 'str3', 1)" +$CLICKHOUSE_CLIENT -q "insert into test_02841 values (5, 'str5', 99)" +$CLICKHOUSE_CLIENT -q "insert into test_02841 values (6, 'str6', 1)" +$CLICKHOUSE_CLIENT -q "insert into test_02841 values (7, 'str7', 1)" + +echo "Without parallel formatting" +for format in JSON JSONEachRow JSONCompact JSONCompactEachRow JSONObjectEachRow XML +do + echo $format + ${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 order by x format $format settings output_format_parallel_formatting=0" | sed "s/(version .*)//" | sed "s/DB::Exception//" +done + +echo "With parallel formatting" +for format in JSON JSONCompact JSONObjectEachRow +do + echo $format + ${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 format $format settings output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" +done + +for format in JSONEachRow JSONCompactEachRow +do + echo $format + ${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 format $format settings output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=LineAsString -q "select min(isValidJSON(line)) from table" +done + + +echo 
"Test 1" +$CLICKHOUSE_CLIENT -q "truncate table test_02841" +$CLICKHOUSE_CLIENT -q "insert into test_02841 select 1, repeat('aaaaa', 1000000), 1" +$CLICKHOUSE_CLIENT -q "insert into test_02841 select 2, repeat('aaaaa', 1000000), 99" +$CLICKHOUSE_CLIENT -q "insert into test_02841 select 3, repeat('aaaaa', 1000000), 1" + +${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=0" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" +${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" + + +echo "Test 2" +$CLICKHOUSE_CLIENT -q "truncate table test_02841" +$CLICKHOUSE_CLIENT -q "insert into test_02841 values (1, 'str1', 1)" +$CLICKHOUSE_CLIENT -q "insert into test_02841 values (2, 'str2', 1)" +$CLICKHOUSE_CLIENT -q "insert into test_02841 select number, 'str_numbers_1', 1 from numbers(10000)" +$CLICKHOUSE_CLIENT -q "insert into test_02841 values (3, 'str4', 99)" +$CLICKHOUSE_CLIENT -q "insert into test_02841 values (4, 'str5', 1)" +$CLICKHOUSE_CLIENT -q "insert into test_02841 select number, 'str_numbers_2', 1 from numbers(10000)" + +${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=0" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" +${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" + +echo "Test 3" +$CLICKHOUSE_CLIENT -q "truncate table test_02841" +$CLICKHOUSE_CLIENT -q "insert into test_02841 values (1, 'str1', 1)" +$CLICKHOUSE_CLIENT -q "insert into test_02841 values (2, 'str2', 1)" +$CLICKHOUSE_CLIENT -q "insert into test_02841 select number, 'str_numbers_1', number > 9000 ? 
99 : 1 from numbers(10000)" +$CLICKHOUSE_CLIENT -q "insert into test_02841 values (3, 'str4', 1)" +$CLICKHOUSE_CLIENT -q "insert into test_02841 values (4, 'str5', 1)" +$CLICKHOUSE_CLIENT -q "insert into test_02841 select number, 'str_numbers_2', 1 from numbers(10000)" + +${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=0" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" +${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" + +$CLICKHOUSE_CLIENT -q "drop table test_02841" + From fa905ebd27f56c4dcf3b4550963d7f4cab94c2e5 Mon Sep 17 00:00:00 2001 From: avogar Date: Tue, 1 Aug 2023 10:14:09 +0000 Subject: [PATCH 020/101] Clean up --- src/Formats/FormatFactory.cpp | 1 - .../OutputFormatWithExceptionHandlerAdaptor.h | 75 ------------------- 2 files changed, 76 deletions(-) delete mode 100644 src/Processors/Formats/OutputFormatWithExceptionHandlerAdaptor.h diff --git a/src/Formats/FormatFactory.cpp b/src/Formats/FormatFactory.cpp index 4cd2ad5be03..1ad2c2285d9 100644 --- a/src/Formats/FormatFactory.cpp +++ b/src/Formats/FormatFactory.cpp @@ -1,7 +1,6 @@ #include #include -//#include #include #include #include diff --git a/src/Processors/Formats/OutputFormatWithExceptionHandlerAdaptor.h b/src/Processors/Formats/OutputFormatWithExceptionHandlerAdaptor.h deleted file mode 100644 index bb318dae81e..00000000000 --- a/src/Processors/Formats/OutputFormatWithExceptionHandlerAdaptor.h +++ /dev/null @@ -1,75 +0,0 @@ -#pragma once - -#include -#include - -#include -#include - -namespace DB -{ - -template -class RowOutputFormatWithExceptionHandlerAdaptorBase : public Base -{ -public: - RowOutputFormatWithExceptionHandlerAdaptorBase(bool handle_exceptions, const Block & header, WriteBuffer & out_, Args... args) - : Base(header, out_, std::forward(args)...) - { - if (handle_exceptions) - peekable_out = std::make_unique(*Base::getWriteBufferPtr()); - } - - void write(const Columns & columns, size_t row_num) - { - if (!peekable_out) - Base::write(columns, row_num); - - - PeekableWriteBufferCheckpoint checkpoint(*peekable_out); - try - { - Base::write(columns, row_num); - } - catch (...) - { - peekable_out->rollbackToCheckpoint(); - throw; - } - } - - void flush() override - { - getWriteBufferPtr()->next(); - - if (peekable_out) - Base::getWriteBufferPtr()->next(); - } - - void finalizeBuffers() override - { - if (peekable_out) - peekable_out->finalize(); - } - - void resetFormatterImpl() override - { - peekable_out = std::make_unique(*Base::getWriteBufferPtr()); - } - -protected: - /// Returns buffer that should be used in derived classes instead of out. 
- WriteBuffer * getWriteBufferPtr() override - { - if (peekable_out) - peekable_out.get(); - return Base::getWriteBufferPtr(); - } - -private: - - std::unique_ptr peekable_out; -}; - -} - From 2adb25e5caacc87182ea5aa7c8a431b5867d3180 Mon Sep 17 00:00:00 2001 From: avogar Date: Tue, 1 Aug 2023 10:21:32 +0000 Subject: [PATCH 021/101] Add examples in docs --- docs/en/interfaces/http.md | 68 ++++++++++++++++++++++++++++++++++++++ 1 file changed, 68 insertions(+) diff --git a/docs/en/interfaces/http.md b/docs/en/interfaces/http.md index b28180fec67..a66b4ff5d5d 100644 --- a/docs/en/interfaces/http.md +++ b/docs/en/interfaces/http.md @@ -707,6 +707,74 @@ To prevent it, you can use setting `http_write_exception_in_output_format` (enab Examples: ```bash +$ curl 'http://localhost:8123/?query=SELECT+number,+throwIf(number>3)+from+system.numbers+format+JSON+settings+max_block_size=1&http_write_exception_in_output_format=1' +{ + "meta": + [ + { + "name": "number", + "type": "UInt64" + }, + { + "name": "throwIf(greater(number, 2))", + "type": "UInt8" + } + ], + "data": + [ + { + "number": "0", + "throwIf(greater(number, 2))": 0 + }, + { + "number": "1", + "throwIf(greater(number, 2))": 0 + }, + { + "number": "2", + "throwIf(greater(number, 2))": 0 + } + ], + + "rows": 3, + + "exception": "Code: 395. DB::Exception: Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 2) :: 2) -> throwIf(greater(number, 2)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) (version 23.8.1.1)" +} +``` + +```bash +$ curl 'http://localhost:8123/?query=SELECT+number,+throwIf(number>2)+from+system.numbers+format+XML+settings+max_block_size=1&http_write_exception_in_output_format=1' + + + + + + number + UInt64 + + + throwIf(greater(number, 2)) + UInt8 + + + + + + 0 + 0 + + + 1 + 0 + + + 2 + 0 + + + 3 + Code: 395. DB::Exception: Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 2) :: 2) -> throwIf(greater(number, 2)) UInt8 : 1'. 
(FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) (version 23.8.1.1) + ``` From d12e96177a390464349d71888aef3d1b19243c2d Mon Sep 17 00:00:00 2001 From: avogar Date: Tue, 1 Aug 2023 16:17:03 +0000 Subject: [PATCH 022/101] Fix tests --- .../OptimizeDateOrDateTimeConverterWithPreimagePass.cpp | 2 +- src/IO/PeekableWriteBuffer.cpp | 2 +- .../Formats/Impl/JSONCompactEachRowRowOutputFormat.cpp | 6 ++++++ .../Formats/Impl/JSONCompactEachRowRowOutputFormat.h | 2 ++ src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.cpp | 5 +++++ src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.h | 2 ++ .../Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp | 2 +- src/Processors/Formats/Impl/JSONRowOutputFormat.cpp | 1 + .../Formats/Impl/ParallelFormattingOutputFormat.cpp | 4 ++-- .../Formats/Impl/ParallelFormattingOutputFormat.h | 4 ++++ src/Processors/Formats/Impl/XMLRowOutputFormat.cpp | 5 +++-- .../Formats/OutputFormatWithUTF8ValidationAdaptor.h | 6 +++++- .../Formats/RowOutputFormatWithExceptionHandlerAdaptor.h | 4 +++- 13 files changed, 36 insertions(+), 9 deletions(-) diff --git a/src/Analyzer/Passes/OptimizeDateOrDateTimeConverterWithPreimagePass.cpp b/src/Analyzer/Passes/OptimizeDateOrDateTimeConverterWithPreimagePass.cpp index 7205ac299a9..774c07ef1d4 100644 --- a/src/Analyzer/Passes/OptimizeDateOrDateTimeConverterWithPreimagePass.cpp +++ b/src/Analyzer/Passes/OptimizeDateOrDateTimeConverterWithPreimagePass.cpp @@ -48,7 +48,7 @@ public: return true; } - void visitImpl(QueryTreeNodePtr & node) const + void enterImpl(QueryTreeNodePtr & node) const { const static std::unordered_map swap_relations = { {"equals", "equals"}, diff --git a/src/IO/PeekableWriteBuffer.cpp b/src/IO/PeekableWriteBuffer.cpp index dc7f87dd539..87c7291c377 100644 --- a/src/IO/PeekableWriteBuffer.cpp +++ b/src/IO/PeekableWriteBuffer.cpp @@ -6,7 +6,7 @@ namespace DB PeekableWriteBuffer::PeekableWriteBuffer(DB::WriteBuffer & sub_buf_) : BufferWithOwnMemory(0), sub_buf(sub_buf_) { Buffer & sub_working = sub_buf.buffer(); - BufferBase::set(sub_working.begin(), sub_working.size(), sub_buf.offset()); + BufferBase::set(sub_working.begin() + sub_buf.offset(), sub_working.size() - sub_buf.offset(), 0); } void PeekableWriteBuffer::nextImpl() diff --git a/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.cpp index c5c9af60982..530d09d5c87 100644 --- a/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.cpp @@ -116,6 +116,12 @@ void JSONCompactEachRowRowOutputFormat::writeSuffix() } } +void JSONCompactEachRowRowOutputFormat::resetFormatterImpl() +{ + RowOutputFormatWithExceptionHandlerAdaptor::resetFormatterImpl(); + ostr = RowOutputFormatWithExceptionHandlerAdaptor::getWriteBufferPtr(); +} + void registerOutputFormatJSONCompactEachRow(FormatFactory & factory) { for (bool yield_strings : {false, true}) diff --git a/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.h b/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.h index a05fff699a5..bd32592a4a0 100644 --- a/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.h +++ b/src/Processors/Formats/Impl/JSONCompactEachRowRowOutputFormat.h @@ -36,6 +36,8 @@ private: void writeRowEndDelimiter() override; void writeSuffix() override; + void resetFormatterImpl() override; + bool supportTotals() const override { return true; } void consumeTotals(Chunk) override; diff --git 
a/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.cpp index 2169d815fbf..a7118c2154a 100644 --- a/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.cpp @@ -92,6 +92,11 @@ void JSONEachRowRowOutputFormat::writeSuffix() writeCString("\n]\n", *ostr); } +void JSONEachRowRowOutputFormat::resetFormatterImpl() +{ + RowOutputFormatWithExceptionHandlerAdaptor::resetFormatterImpl(); + ostr = RowOutputFormatWithExceptionHandlerAdaptor::getWriteBufferPtr(); +} void registerOutputFormatJSONEachRow(FormatFactory & factory) { diff --git a/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.h b/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.h index 28bfbf2e6ac..2de9369846b 100644 --- a/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.h +++ b/src/Processors/Formats/Impl/JSONEachRowRowOutputFormat.h @@ -39,6 +39,8 @@ protected: void writePrefix() override; void writeSuffix() override; + void resetFormatterImpl() override; + size_t field_number = 0; bool pretty_json; diff --git a/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp index 8f4d11a604a..26aa0aad97c 100644 --- a/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp @@ -68,7 +68,7 @@ void JSONObjectEachRowRowOutputFormat::writeSuffix() writeRowBetweenDelimiter(); JSONUtils::writeException(exception_message, *ostr, settings, 1); } - + JSONUtils::writeObjectEnd(*ostr); writeChar('\n', *ostr); } diff --git a/src/Processors/Formats/Impl/JSONRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONRowOutputFormat.cpp index e4c4e2a3bc6..20182d84917 100644 --- a/src/Processors/Formats/Impl/JSONRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONRowOutputFormat.cpp @@ -135,6 +135,7 @@ void JSONRowOutputFormat::finalizeImpl() void JSONRowOutputFormat::resetFormatterImpl() { RowOutputFormatWithExceptionHandlerAdaptor::resetFormatterImpl(); + ostr = RowOutputFormatWithExceptionHandlerAdaptor::getWriteBufferPtr(); row_count = 0; statistics = Statistics(); } diff --git a/src/Processors/Formats/Impl/ParallelFormattingOutputFormat.cpp b/src/Processors/Formats/Impl/ParallelFormattingOutputFormat.cpp index 3e63e2abd6c..841ef683228 100644 --- a/src/Processors/Formats/Impl/ParallelFormattingOutputFormat.cpp +++ b/src/Processors/Formats/Impl/ParallelFormattingOutputFormat.cpp @@ -36,10 +36,10 @@ namespace DB formatter->setRowsReadBefore(rows_collected); formatter->setException(exception_message); - if (!collected_prefix) + if (!collected_prefix && (need_write_prefix || started_prefix)) formatter->writePrefix(); - if (!collected_suffix) + if (!collected_suffix && (need_write_suffix || started_suffix)) formatter->writeSuffix(); if (!collected_finalize) diff --git a/src/Processors/Formats/Impl/ParallelFormattingOutputFormat.h b/src/Processors/Formats/Impl/ParallelFormattingOutputFormat.h index b9a3b7638fa..bf8968dd376 100644 --- a/src/Processors/Formats/Impl/ParallelFormattingOutputFormat.h +++ b/src/Processors/Formats/Impl/ParallelFormattingOutputFormat.h @@ -118,6 +118,7 @@ public: void writePrefix() override { addChunk(Chunk{}, ProcessingUnitType::START, /*can_throw_exception*/ true); + started_prefix = true; } void onCancel() override @@ -134,6 +135,7 @@ public: void writeSuffix() override { addChunk(Chunk{}, ProcessingUnitType::PLAIN_FINISH, 
/*can_throw_exception*/ true); + started_suffix = true; } String getContentType() const override @@ -259,7 +261,9 @@ private: String exception_message; bool exception_is_rethrown = false; + bool started_prefix = false; bool collected_prefix = false; + bool started_suffix = false; bool collected_suffix = false; bool collected_finalize = false; diff --git a/src/Processors/Formats/Impl/XMLRowOutputFormat.cpp b/src/Processors/Formats/Impl/XMLRowOutputFormat.cpp index eb735cc93aa..52c161c3208 100644 --- a/src/Processors/Formats/Impl/XMLRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/XMLRowOutputFormat.cpp @@ -8,7 +8,7 @@ namespace DB { XMLRowOutputFormat::XMLRowOutputFormat(WriteBuffer & out_, const Block & header_, const FormatSettings & format_settings_) - : RowOutputFormatWithExceptionHandlerAdaptor(header_, out_, true, format_settings_.xml.valid_output_on_exception), fields(header_.getNamesAndTypes()), format_settings(format_settings_) + : RowOutputFormatWithExceptionHandlerAdaptor(header_, out_, format_settings_.xml.valid_output_on_exception, true), fields(header_.getNamesAndTypes()), format_settings(format_settings_) { ostr = RowOutputFormatWithExceptionHandlerAdaptor::getWriteBufferPtr(); const auto & sample = getPort(PortKind::Main).getHeader(); @@ -203,7 +203,8 @@ void XMLRowOutputFormat::finalizeImpl() void XMLRowOutputFormat::resetFormatterImpl() { - RowOutputFormatWithUTF8ValidationAdaptor::resetFormatterImpl(); + RowOutputFormatWithExceptionHandlerAdaptor::resetFormatterImpl(); + ostr = RowOutputFormatWithExceptionHandlerAdaptor::getWriteBufferPtr(); row_count = 0; statistics = Statistics(); } diff --git a/src/Processors/Formats/OutputFormatWithUTF8ValidationAdaptor.h b/src/Processors/Formats/OutputFormatWithUTF8ValidationAdaptor.h index f86ff278b33..4c5c3ef72e9 100644 --- a/src/Processors/Formats/OutputFormatWithUTF8ValidationAdaptor.h +++ b/src/Processors/Formats/OutputFormatWithUTF8ValidationAdaptor.h @@ -6,6 +6,8 @@ #include #include +#include + namespace DB { @@ -43,8 +45,10 @@ public: void resetFormatterImpl() override { + LOG_DEBUG(&Poco::Logger::get("RowOutputFormatWithExceptionHandlerAdaptor"), "resetFormatterImpl"); Base::resetFormatterImpl(); - validating_ostr = std::make_unique(*Base::getWriteBufferPtr()); + if (validating_ostr) + validating_ostr = std::make_unique(*Base::getWriteBufferPtr()); } protected: diff --git a/src/Processors/Formats/RowOutputFormatWithExceptionHandlerAdaptor.h b/src/Processors/Formats/RowOutputFormatWithExceptionHandlerAdaptor.h index 4e797c521c0..22232e9f654 100644 --- a/src/Processors/Formats/RowOutputFormatWithExceptionHandlerAdaptor.h +++ b/src/Processors/Formats/RowOutputFormatWithExceptionHandlerAdaptor.h @@ -76,8 +76,10 @@ public: void resetFormatterImpl() override { + LOG_DEBUG(&Poco::Logger::get("RowOutputFormatWithExceptionHandlerAdaptor"), "resetFormatterImpl"); Base::resetFormatterImpl(); - peekable_out = std::make_unique(*Base::getWriteBufferPtr()); + if (peekable_out) + peekable_out = std::make_unique(*Base::getWriteBufferPtr()); } bool supportsWritingException() const override { return true; } From 81866bcc9c3f7fcf68ec9cd908a0fa7013dbf980 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Wed, 2 Aug 2023 12:35:58 +0200 Subject: [PATCH 023/101] Fix special build --- .../Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp 
b/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp index 26aa0aad97c..46b3f56f3cc 100644 --- a/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp @@ -28,7 +28,7 @@ void JSONObjectEachRowRowOutputFormat::write(const Columns & columns, size_t row else object_name = "row_" + std::to_string(row + 1); - IRowOutputFormat::write(columns, row); + RowOutputFormatWithExceptionHandlerAdaptor::write(columns, row); } void JSONObjectEachRowRowOutputFormat::writeFieldDelimiter() From 77cc84a4d2937bea024c1cefbcf17f99ee7ac7c7 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Wed, 2 Aug 2023 12:43:25 +0200 Subject: [PATCH 024/101] Fix test --- ...41_valid_json_and_xml_on_http_exception.sh | 28 ++++++++++--------- 1 file changed, 15 insertions(+), 13 deletions(-) diff --git a/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.sh b/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.sh index cb4d1b6aee1..60ce7eb3b6f 100755 --- a/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.sh +++ b/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.sh @@ -4,6 +4,8 @@ CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # shellcheck source=../shell_config.sh . "$CUR_DIR"/../shell_config.sh +CH_URL='$CLICKHOUSE_URL&http_write_exception_in_output_format=1&allow_experimental_analyzer=0' + echo "One block" for parallel in 0 1 do @@ -11,7 +13,7 @@ do for format in JSON JSONEachRow JSONCompact JSONCompactEachRow JSONObjectEachRow XML do echo $format - ${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select number, throwIf(number > 3) as res from numbers(10) format $format settings output_format_parallel_formatting=$parallel" | sed "s/(version .*)//" | sed "s/DB::Exception//" + ${CLICKHOUSE_CURL} -sS "$CH_URL" -d "select number, throwIf(number > 3) as res from numbers(10) format $format settings output_format_parallel_formatting=$parallel" | sed "s/(version .*)//" | sed "s/DB::Exception//" done done @@ -20,20 +22,20 @@ echo "Without parallel formatting" for format in JSON JSONEachRow JSONCompact JSONCompactEachRow JSONObjectEachRow XML do echo $format - ${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select number, throwIf(number > 3) as res from system.numbers format $format settings max_block_size=1, output_format_parallel_formatting=0" | sed "s/(version .*)//" | sed "s/DB::Exception//" + ${CLICKHOUSE_CURL} -sS "$CH_URL" -d "select number, throwIf(number > 3) as res from system.numbers format $format settings max_block_size=1, output_format_parallel_formatting=0" | sed "s/(version .*)//" | sed "s/DB::Exception//" done echo "With parallel formatting" for format in JSON JSONCompact JSONObjectEachRow do echo $format - ${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select number, throwIf(number > 3) as res from system.numbers format $format settings max_block_size=1, output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" + ${CLICKHOUSE_CURL} -sS "$CH_URL" -d "select number, throwIf(number > 3) as res from system.numbers format $format settings max_block_size=1, output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" done for format in JSONEachRow JSONCompactEachRow do 
echo $format - ${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select number, throwIf(number > 3) as res from system.numbers format $format settings max_block_size=1, output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=LineAsString -q "select min(isValidJSON(line)) from table" + ${CLICKHOUSE_CURL} -sS "$CH_URL" -d "select number, throwIf(number > 3) as res from system.numbers format $format settings max_block_size=1, output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=LineAsString -q "select min(isValidJSON(line)) from table" done echo "Formatting error" @@ -51,20 +53,20 @@ echo "Without parallel formatting" for format in JSON JSONEachRow JSONCompact JSONCompactEachRow JSONObjectEachRow XML do echo $format - ${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 order by x format $format settings output_format_parallel_formatting=0" | sed "s/(version .*)//" | sed "s/DB::Exception//" + ${CLICKHOUSE_CURL} -sS "$CH_URL" -d "select * from test_02841 order by x format $format settings output_format_parallel_formatting=0" | sed "s/(version .*)//" | sed "s/DB::Exception//" done echo "With parallel formatting" for format in JSON JSONCompact JSONObjectEachRow do echo $format - ${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 format $format settings output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" + ${CLICKHOUSE_CURL} -sS "$CH_URL" -d "select * from test_02841 format $format settings output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" done for format in JSONEachRow JSONCompactEachRow do echo $format - ${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 format $format settings output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=LineAsString -q "select min(isValidJSON(line)) from table" + ${CLICKHOUSE_CURL} -sS "$CH_URL" -d "select * from test_02841 format $format settings output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=LineAsString -q "select min(isValidJSON(line)) from table" done @@ -74,8 +76,8 @@ $CLICKHOUSE_CLIENT -q "insert into test_02841 select 1, repeat('aaaaa', 1000000) $CLICKHOUSE_CLIENT -q "insert into test_02841 select 2, repeat('aaaaa', 1000000), 99" $CLICKHOUSE_CLIENT -q "insert into test_02841 select 3, repeat('aaaaa', 1000000), 1" -${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=0" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" -${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" +${CLICKHOUSE_CURL} -sS "$CH_URL" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=0" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" +${CLICKHOUSE_CURL} -sS "$CH_URL" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from 
table" echo "Test 2" @@ -87,8 +89,8 @@ $CLICKHOUSE_CLIENT -q "insert into test_02841 values (3, 'str4', 99)" $CLICKHOUSE_CLIENT -q "insert into test_02841 values (4, 'str5', 1)" $CLICKHOUSE_CLIENT -q "insert into test_02841 select number, 'str_numbers_2', 1 from numbers(10000)" -${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=0" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" -${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" +${CLICKHOUSE_CURL} -sS "$CH_URL" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=0" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" +${CLICKHOUSE_CURL} -sS "$CH_URL" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" echo "Test 3" $CLICKHOUSE_CLIENT -q "truncate table test_02841" @@ -99,8 +101,8 @@ $CLICKHOUSE_CLIENT -q "insert into test_02841 values (3, 'str4', 1)" $CLICKHOUSE_CLIENT -q "insert into test_02841 values (4, 'str5', 1)" $CLICKHOUSE_CLIENT -q "insert into test_02841 select number, 'str_numbers_2', 1 from numbers(10000)" -${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=0" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" -${CLICKHOUSE_CURL} -sS "$CLICKHOUSE_URL&http_write_exception_in_output_format=1" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" +${CLICKHOUSE_CURL} -sS "$CH_URL" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=0" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" +${CLICKHOUSE_CURL} -sS "$CH_URL" -d "select * from test_02841 format JSON settings output_format_parallel_formatting=1" | $CLICKHOUSE_LOCAL --input-format=JSONAsString -q "select isValidJSON(json) from table" $CLICKHOUSE_CLIENT -q "drop table test_02841" From d85b16dc71256049269d279bbcc2aab45ff688ee Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Wed, 2 Aug 2023 12:45:26 +0200 Subject: [PATCH 025/101] Fix test reference --- ...2841_valid_json_and_xml_on_http_exception.reference | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.reference b/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.reference index 452aa9d5022..1818ca7b5f2 100644 --- a/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.reference +++ b/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.reference @@ -230,9 +230,9 @@ JSONCompactEachRow JSONObjectEachRow { "row_1": {"number":"0","res":0}, - "row_1": {"number":"1","res":0}, - "row_1": {"number":"2","res":0}, - "row_1": {"number":"3","res":0}, + "row_2": {"number":"1","res":0}, + "row_3": {"number":"2","res":0}, + "row_4": {"number":"3","res":0}, "exception": 
"Code: 395. : Value passed to 'throwIf' function is non-zero: while executing 'FUNCTION throwIf(greater(number, 3) :: 2) -> throwIf(greater(number, 3)) UInt8 : 1'. (FUNCTION_THROW_IF_VALUE_IS_NON_ZERO) " } XML @@ -367,8 +367,8 @@ JSONCompactEachRow JSONObjectEachRow { "row_1": {"x":1,"s":"str1","y":"a"}, - "row_1": {"x":2,"s":"str2","y":"a"}, - "row_1": {"x":3,"s":"str3","y":"a"}, + "row_2": {"x":2,"s":"str2","y":"a"}, + "row_3": {"x":3,"s":"str3","y":"a"}, "exception": "Code: 36. : Unexpected value 99 in enum: While executing JSONObjectEachRowRowOutputFormat. (BAD_ARGUMENTS) " } XML From ab78f9a94301441d077c6fb902618cdff3a3d443 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Fri, 4 Aug 2023 19:08:35 +0200 Subject: [PATCH 026/101] Fix test --- .../0_stateless/02841_valid_json_and_xml_on_http_exception.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.sh b/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.sh index 60ce7eb3b6f..26b3ef64d61 100755 --- a/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.sh +++ b/tests/queries/0_stateless/02841_valid_json_and_xml_on_http_exception.sh @@ -4,7 +4,7 @@ CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # shellcheck source=../shell_config.sh . "$CUR_DIR"/../shell_config.sh -CH_URL='$CLICKHOUSE_URL&http_write_exception_in_output_format=1&allow_experimental_analyzer=0' +CH_URL="$CLICKHOUSE_URL&http_write_exception_in_output_format=1&allow_experimental_analyzer=0" echo "One block" for parallel in 0 1 From 67ee1a2385e3dc3235bee24f7d20ff181dc3aa36 Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Mon, 7 Aug 2023 15:00:25 +0000 Subject: [PATCH 027/101] fix tests --- .../test_compression_nested_columns/test.py | 2 +- .../configs/long_names.xml | 5 +++++ .../configs/wide_parts_only.xml | 1 - .../test_default_compression_codec/test.py | 12 ++++++++++-- tests/integration/test_filesystem_layout/test.py | 2 +- 5 files changed, 17 insertions(+), 5 deletions(-) create mode 100644 tests/integration/test_default_compression_codec/configs/long_names.xml diff --git a/tests/integration/test_compression_nested_columns/test.py b/tests/integration/test_compression_nested_columns/test.py index 55d88174287..3541a9f6061 100644 --- a/tests/integration/test_compression_nested_columns/test.py +++ b/tests/integration/test_compression_nested_columns/test.py @@ -48,7 +48,7 @@ def test_nested_compression_codec(start_cluster): column_array Array(Array(UInt64)) CODEC(T64, LZ4), column_bad LowCardinality(Int64) CODEC(Delta) ) ENGINE = ReplicatedMergeTree('/t', '{}') ORDER BY tuple() PARTITION BY key - SETTINGS min_rows_for_wide_part = 0, min_bytes_for_wide_part = 0; + SETTINGS min_rows_for_wide_part = 0, min_bytes_for_wide_part = 0, replace_long_file_name_to_hash = 0; """.format( i ), diff --git a/tests/integration/test_default_compression_codec/configs/long_names.xml b/tests/integration/test_default_compression_codec/configs/long_names.xml new file mode 100644 index 00000000000..1dc241dbf05 --- /dev/null +++ b/tests/integration/test_default_compression_codec/configs/long_names.xml @@ -0,0 +1,5 @@ + + + 0 + + diff --git a/tests/integration/test_default_compression_codec/configs/wide_parts_only.xml b/tests/integration/test_default_compression_codec/configs/wide_parts_only.xml index 4d1a3357799..10b9edef36d 100644 --- a/tests/integration/test_default_compression_codec/configs/wide_parts_only.xml +++ 
b/tests/integration/test_default_compression_codec/configs/wide_parts_only.xml @@ -2,6 +2,5 @@ 0 0 - 0 diff --git a/tests/integration/test_default_compression_codec/test.py b/tests/integration/test_default_compression_codec/test.py index c7c30f5eea4..abaf160e26a 100644 --- a/tests/integration/test_default_compression_codec/test.py +++ b/tests/integration/test_default_compression_codec/test.py @@ -9,12 +9,20 @@ cluster = ClickHouseCluster(__file__) node1 = cluster.add_instance( "node1", - main_configs=["configs/default_compression.xml", "configs/wide_parts_only.xml"], + main_configs=[ + "configs/default_compression.xml", + "configs/wide_parts_only.xml", + "configs/long_names.xml", + ], with_zookeeper=True, ) node2 = cluster.add_instance( "node2", - main_configs=["configs/default_compression.xml", "configs/wide_parts_only.xml"], + main_configs=[ + "configs/default_compression.xml", + "configs/wide_parts_only.xml", + "configs/long_names.xml", + ], with_zookeeper=True, ) node3 = cluster.add_instance( diff --git a/tests/integration/test_filesystem_layout/test.py b/tests/integration/test_filesystem_layout/test.py index 81f3b67cb75..4e719aa0fe9 100644 --- a/tests/integration/test_filesystem_layout/test.py +++ b/tests/integration/test_filesystem_layout/test.py @@ -48,7 +48,7 @@ def test_file_path_escaping(started_cluster): node.query( """ CREATE TABLE `test 2`.`T.a_b,l-e!` UUID '12345678-1000-4000-8000-000000000001' (`~Id` UInt32) - ENGINE = MergeTree() PARTITION BY `~Id` ORDER BY `~Id` SETTINGS min_bytes_for_wide_part = 0; + ENGINE = MergeTree() PARTITION BY `~Id` ORDER BY `~Id` SETTINGS min_bytes_for_wide_part = 0, replace_long_file_name_to_hash = 0; """ ) node.query("""INSERT INTO `test 2`.`T.a_b,l-e!` VALUES (1);""") From 8fa1f69fdf7143d0fbf27ff93853e6f64844f23c Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Tue, 8 Aug 2023 11:16:37 +0000 Subject: [PATCH 028/101] fix part columns modification time --- src/Storages/MergeTree/MergeTreeDataPartWide.cpp | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/src/Storages/MergeTree/MergeTreeDataPartWide.cpp b/src/Storages/MergeTree/MergeTreeDataPartWide.cpp index b3ef45b46e5..1b0de863289 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWide.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartWide.cpp @@ -271,7 +271,8 @@ std::optional MergeTreeDataPartWide::getColumnModificationTime(const Str { try { - return getDataPartStorage().getFileLastModified(column_name + DATA_FILE_EXTENSION).epochTime(); + auto name_on_disk = checksums.getFileNameOrHash(column_name); + return getDataPartStorage().getFileLastModified(name_on_disk + DATA_FILE_EXTENSION).epochTime(); } catch (const fs::filesystem_error &) { From 078683e226c5beb1ab1870881feab42def97f904 Mon Sep 17 00:00:00 2001 From: avogar Date: Thu, 10 Aug 2023 13:07:06 +0000 Subject: [PATCH 029/101] Fix tests --- .../Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp | 3 ++- src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.h | 1 + 2 files changed, 3 insertions(+), 1 deletion(-) diff --git a/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp b/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp index 46b3f56f3cc..5d8e74309e3 100644 --- a/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp +++ b/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.cpp @@ -26,8 +26,9 @@ void JSONObjectEachRowRowOutputFormat::write(const Columns & columns, size_t row if (field_index_for_object_name) object_name = 
columns[*field_index_for_object_name]->getDataAt(row).toString(); else - object_name = "row_" + std::to_string(row + 1); + object_name = "row_" + std::to_string(getRowsReadBefore() + rows + 1); + ++rows; RowOutputFormatWithExceptionHandlerAdaptor::write(columns, row); } diff --git a/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.h b/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.h index 1981931e91b..d8ab2b09e66 100644 --- a/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.h +++ b/src/Processors/Formats/Impl/JSONObjectEachRowRowOutputFormat.h @@ -40,6 +40,7 @@ private: std::optional field_index_for_object_name; String object_name; + size_t rows = 0; }; } From 2e22b17d57aa772134f64abd41d8377b2191f211 Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Tue, 15 Aug 2023 00:38:07 +0000 Subject: [PATCH 030/101] add docs and settings randomizations --- docs/en/operations/settings/merge-tree-settings.md | 11 +++++++++-- src/Storages/MergeTree/MergeTreeSettings.h | 4 ++-- tests/clickhouse-test | 2 ++ 3 files changed, 13 insertions(+), 4 deletions(-) diff --git a/docs/en/operations/settings/merge-tree-settings.md b/docs/en/operations/settings/merge-tree-settings.md index 4122b4af40f..36365c59b35 100644 --- a/docs/en/operations/settings/merge-tree-settings.md +++ b/docs/en/operations/settings/merge-tree-settings.md @@ -555,7 +555,7 @@ Merge reads rows from parts in blocks of `merge_max_block_size` rows, then merge ## number_of_free_entries_in_pool_to_lower_max_size_of_merge {#number-of-free-entries-in-pool-to-lower-max-size-of-merge} -When there is less than specified number of free entries in pool (or replicated queue), start to lower maximum size of merge to process (or to put in queue). +When there is less than specified number of free entries in pool (or replicated queue), start to lower maximum size of merge to process (or to put in queue). This is to allow small merges to process - not filling the pool with long running merges. Possible values: @@ -566,7 +566,7 @@ Default value: 8 ## number_of_free_entries_in_pool_to_execute_mutation {#number-of-free-entries-in-pool-to-execute-mutation} -When there is less than specified number of free entries in pool, do not execute part mutations. +When there is less than specified number of free entries in pool, do not execute part mutations. This is to leave free threads for regular merges and avoid "Too many parts". Possible values: @@ -832,6 +832,13 @@ You can see which parts of `s` were stored using the sparse serialization: └────────┴────────────────────┘ ``` +## replace_long_file_name_to_hash {#ratio_of_defaults_for_sparse_serialization} +If the file name for column is too long (more than `max_file_name_length` bytes) replace it to SipHash128. Default value: `false`. + +## max_file_name_length {#max_file_name_length} + +The maximal length of the file name to keep it as is without hashing. Takes effect only if setting `replace_long_file_name_to_hash` is enabled. Default value: 128. + ## clean_deleted_rows Enable/disable automatic deletion of rows flagged as `is_deleted` when perform `OPTIMIZE ... FINAL` on a table using the ReplacingMergeTree engine. When disabled, the `CLEANUP` keyword has to be added to the `OPTIMIZE ... FINAL` to have the same behaviour. 
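As a usage illustration for the two settings documented above, the new behaviour can be enabled per table through the same `SETTINGS` clause the integration and stateless tests in this patch set use. This is only a sketch: the table and column names are hypothetical, and `max_file_name_length` is set artificially low so the long column name clearly exceeds it.

```sql
-- Hypothetical table: once a column's stream file name is longer than
-- max_file_name_length bytes, it is written on disk under its SipHash128 hash.
CREATE TABLE test_long_file_names
(
    `key` UInt64,
    `column_with_a_very_long_and_descriptive_name_exceeding_the_limit` String
)
ENGINE = MergeTree
ORDER BY key
SETTINGS replace_long_file_name_to_hash = 1, max_file_name_length = 8;
```

The tests touched by the earlier commits disable the feature explicitly (`replace_long_file_name_to_hash = 0`), presumably because they inspect the literal on-disk file names of columns.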
diff --git a/src/Storages/MergeTree/MergeTreeSettings.h b/src/Storages/MergeTree/MergeTreeSettings.h index 802bd74dbf8..38bcb0fc94c 100644 --- a/src/Storages/MergeTree/MergeTreeSettings.h +++ b/src/Storages/MergeTree/MergeTreeSettings.h @@ -34,8 +34,8 @@ struct Settings; M(UInt64, min_bytes_for_wide_part, 10485760, "Minimal uncompressed size in bytes to create part in wide format instead of compact", 0) \ M(UInt64, min_rows_for_wide_part, 0, "Minimal number of rows to create part in wide format instead of compact", 0) \ M(Float, ratio_of_defaults_for_sparse_serialization, 0.9375f, "Minimal ratio of number of default values to number of all values in column to store it in sparse serializations. If >= 1, columns will be always written in full serialization.", 0) \ - M(Bool, replace_long_file_name_to_hash, true, "If the file name for column is too long (more than 'max_file_name_length' bytes) replace it to SipHash128", 0) \ - M(UInt64, max_file_name_length, 0, "The maximal length of the file name to keep it as is without hashing", 0) \ + M(Bool, replace_long_file_name_to_hash, false, "If the file name for column is too long (more than 'max_file_name_length' bytes) replace it to SipHash128", 0) \ + M(UInt64, max_file_name_length, 128, "The maximal length of the file name to keep it as is without hashing", 0) \ /** Merge settings. */ \ M(UInt64, merge_max_block_size, 8192, "How many rows in blocks should be formed for merge operations. By default has the same value as `index_granularity`.", 0) \ M(UInt64, merge_max_block_size_bytes, 10 * 1024 * 1024, "How many bytes in blocks should be formed for merge operations. By default has the same value as `index_granularity_bytes`.", 0) \ diff --git a/tests/clickhouse-test b/tests/clickhouse-test index 1ce5ad981ad..7f8bada4a09 100755 --- a/tests/clickhouse-test +++ b/tests/clickhouse-test @@ -668,6 +668,8 @@ class MergeTreeSettingsRandomizer: "compress_primary_key": lambda: random.randint(0, 1), "marks_compress_block_size": lambda: random.randint(8000, 100000), "primary_key_compress_block_size": lambda: random.randint(8000, 100000), + "replace_long_file_name_to_hash": lambda: random.randint(0, 1), + "max_file_name_length": threshold_generator(0.3, 0.3, 0, 128), } @staticmethod From 3e9a1825556a12e9dc5362b1bb29b877be158a4e Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Mon, 21 Aug 2023 13:49:14 +0000 Subject: [PATCH 031/101] better interfaces for getting of stream name in part --- .../settings/merge-tree-settings.md | 2 +- src/Storages/MergeTree/IMergeTreeDataPart.cpp | 83 +++++++++++-- src/Storages/MergeTree/IMergeTreeDataPart.h | 33 +++++- .../MergeTree/IMergedBlockOutputStream.cpp | 15 ++- .../MergeTree/MergeTreeDataPartChecksum.cpp | 12 -- .../MergeTree/MergeTreeDataPartChecksum.h | 3 - .../MergeTree/MergeTreeDataPartCompact.h | 2 +- .../MergeTree/MergeTreeDataPartInMemory.h | 2 +- .../MergeTree/MergeTreeDataPartWide.cpp | 110 +++++++++--------- .../MergeTree/MergeTreeDataPartWide.h | 2 +- .../MergeTree/MergeTreeReaderWide.cpp | 45 +++---- src/Storages/MergeTree/MergeTreeSettings.h | 2 +- src/Storages/MergeTree/MutateTask.cpp | 32 +++-- src/Storages/MergeTree/checkDataPart.cpp | 9 +- .../System/StorageSystemPartsColumns.cpp | 22 ++-- 15 files changed, 227 insertions(+), 147 deletions(-) diff --git a/docs/en/operations/settings/merge-tree-settings.md b/docs/en/operations/settings/merge-tree-settings.md index 36365c59b35..e1d9e76c2ba 100644 --- a/docs/en/operations/settings/merge-tree-settings.md +++ 
b/docs/en/operations/settings/merge-tree-settings.md @@ -832,7 +832,7 @@ You can see which parts of `s` were stored using the sparse serialization: └────────┴────────────────────┘ ``` -## replace_long_file_name_to_hash {#ratio_of_defaults_for_sparse_serialization} +## replace_long_file_name_to_hash {#replace_long_file_name_to_hash} If the file name for column is too long (more than `max_file_name_length` bytes) replace it to SipHash128. Default value: `false`. ## max_file_name_length {#max_file_name_length} diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index 5b2f75b6f00..81330255a5f 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -1034,14 +1034,14 @@ CompressionCodecPtr IMergeTreeDataPart::detectDefaultCompressionCodec() const { if (path_to_data_file.empty()) { - auto candidate_path = ISerialization::getFileNameForStream(part_column, substream_path) + ".bin"; - - if (!getDataPartStorage().exists(candidate_path)) - candidate_path = sipHash128String(candidate_path) + ".bin"; + auto stream_name = getStreamNameForColumn(part_column, substream_path, ".bin", getDataPartStorage()); + if (!stream_name) + return; + auto file_name = *stream_name + ".bin"; /// We can have existing, but empty .bin files. Example: LowCardinality(Nullable(...)) columns and column_name.dict.null.bin file. - if (getDataPartStorage().exists(candidate_path) && getDataPartStorage().getFileSize(candidate_path) != 0) - path_to_data_file = candidate_path; + if (getDataPartStorage().getFileSize(file_name) != 0) + path_to_data_file = file_name; } }); @@ -1326,8 +1326,8 @@ void IMergeTreeDataPart::loadColumns(bool require) auto metadata_snapshot = storage.getInMemoryMetadataPtr(); if (parent_part) metadata_snapshot = metadata_snapshot->projections.get(name).metadata; - NamesAndTypesList loaded_columns; + NamesAndTypesList loaded_columns; bool is_readonly_storage = getDataPartStorage().isReadonly(); if (!metadata_manager->exists("columns.txt")) @@ -1339,7 +1339,7 @@ void IMergeTreeDataPart::loadColumns(bool require) /// If there is no file with a list of columns, write it down. 
for (const NameAndTypePair & column : metadata_snapshot->getColumns().getAllPhysical()) - if (getDataPartStorage().exists(getFileNameForColumn(column) + ".bin")) + if (getFileNameForColumn(column)) loaded_columns.push_back(column); if (columns.empty()) @@ -2090,6 +2090,73 @@ IMergeTreeDataPart::uint128 IMergeTreeDataPart::getActualChecksumByFile(const St return in_hash.getHash(); } +std::optional IMergeTreeDataPart::getStreamNameOrHash( + const String & stream_name, + const Checksums & checksums_) +{ + if (checksums_.files.contains(stream_name + ".bin")) + return stream_name; + + auto hash = sipHash128String(stream_name); + if (checksums_.files.contains(hash + ".bin")) + return hash; + + return {}; +} + +std::optional IMergeTreeDataPart::getStreamNameOrHash( + const String & stream_name, + const String & extension, + const IDataPartStorage & storage_) +{ + if (storage_.exists(stream_name + extension)) + return stream_name; + + auto hash = sipHash128String(stream_name); + if (storage_.exists(hash + extension)) + return stream_name; + + return {}; +} + +std::optional IMergeTreeDataPart::getStreamNameForColumn( + const String & column_name, + const ISerialization::SubstreamPath & substream_path, + const Checksums & checksums_) +{ + auto stream_name = ISerialization::getFileNameForStream(column_name, substream_path); + return getStreamNameOrHash(stream_name, checksums_); +} + +std::optional IMergeTreeDataPart::getStreamNameForColumn( + const NameAndTypePair & column, + const ISerialization::SubstreamPath & substream_path, + const Checksums & checksums_) +{ + auto stream_name = ISerialization::getFileNameForStream(column, substream_path); + return getStreamNameOrHash(stream_name, checksums_); +} + +std::optional IMergeTreeDataPart::getStreamNameForColumn( + const String & column_name, + const ISerialization::SubstreamPath & substream_path, + const String & extension, + const IDataPartStorage & storage_) +{ + auto stream_name = ISerialization::getFileNameForStream(column_name, substream_path); + return getStreamNameOrHash(stream_name, extension, storage_); +} + +std::optional IMergeTreeDataPart::getStreamNameForColumn( + const NameAndTypePair & column, + const ISerialization::SubstreamPath & substream_path, + const String & extension, + const IDataPartStorage & storage_) +{ + auto stream_name = ISerialization::getFileNameForStream(column, substream_path); + return getStreamNameOrHash(stream_name, extension, storage_); +} + std::unordered_map IMergeTreeDataPart::checkMetadata() const { return metadata_manager->check(); diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.h b/src/Storages/MergeTree/IMergeTreeDataPart.h index a8e053a9c7b..34e6801c3ef 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.h +++ b/src/Storages/MergeTree/IMergeTreeDataPart.h @@ -131,7 +131,7 @@ public: /// Return information about secondary indexes size on disk for all indexes in part IndexSize getTotalSeconaryIndicesSize() const { return total_secondary_indices_size; } - virtual String getFileNameForColumn(const NameAndTypePair & column) const = 0; + virtual std::optional getFileNameForColumn(const NameAndTypePair & column) const = 0; virtual ~IMergeTreeDataPart(); @@ -503,6 +503,37 @@ public: /// This one is about removing file with version of part's metadata (columns, pk and so on) void removeMetadataVersion(); + static std::optional getStreamNameOrHash( + const String & name, + const IMergeTreeDataPart::Checksums & checksums); + + static std::optional getStreamNameOrHash( + const String & name, + const String & 
extension, + const IDataPartStorage & storage_); + + static std::optional getStreamNameForColumn( + const String & column_name, + const ISerialization::SubstreamPath & substream_path, + const Checksums & checksums_); + + static std::optional getStreamNameForColumn( + const NameAndTypePair & column, + const ISerialization::SubstreamPath & substream_path, + const Checksums & checksums_); + + static std::optional getStreamNameForColumn( + const String & column_name, + const ISerialization::SubstreamPath & substream_path, + const String & extension, + const IDataPartStorage & storage_); + + static std::optional getStreamNameForColumn( + const NameAndTypePair & column, + const ISerialization::SubstreamPath & substream_path, + const String & extension, + const IDataPartStorage & storage_); + mutable std::atomic removal_state = DataPartRemovalState::NOT_ATTEMPTED; mutable std::atomic last_removal_attempt_time = 0; diff --git a/src/Storages/MergeTree/IMergedBlockOutputStream.cpp b/src/Storages/MergeTree/IMergedBlockOutputStream.cpp index 2df3b6d15a6..c8d6aa0ba65 100644 --- a/src/Storages/MergeTree/IMergedBlockOutputStream.cpp +++ b/src/Storages/MergeTree/IMergedBlockOutputStream.cpp @@ -51,9 +51,9 @@ NameSet IMergedBlockOutputStream::removeEmptyColumnsFromPart( data_part->getSerialization(column.name)->enumerateStreams( [&](const ISerialization::SubstreamPath & substream_path) { - auto full_stream_name = ISerialization::getFileNameForStream(column.name, substream_path); - auto stream_name = checksums.getFileNameOrHash(full_stream_name); - ++stream_counts[stream_name]; + auto stream_name = IMergeTreeDataPart::getStreamNameForColumn(column, substream_path, checksums); + if (stream_name) + ++stream_counts[*stream_name]; }); } @@ -67,14 +67,13 @@ NameSet IMergedBlockOutputStream::removeEmptyColumnsFromPart( ISerialization::StreamCallback callback = [&](const ISerialization::SubstreamPath & substream_path) { - auto full_stream_name = ISerialization::getFileNameForStream(column_name, substream_path); - auto stream_name = checksums.getFileNameOrHash(full_stream_name); + auto stream_name = IMergeTreeDataPart::getStreamNameForColumn(column_name, substream_path, checksums); /// Delete files if they are no longer shared with another column. 
- if (--stream_counts[stream_name] == 0) + if (stream_name && --stream_counts[*stream_name] == 0) { - remove_files.emplace(stream_name + ".bin"); - remove_files.emplace(stream_name + mrk_extension); + remove_files.emplace(*stream_name + ".bin"); + remove_files.emplace(*stream_name + mrk_extension); } }; diff --git a/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp b/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp index 794eba809a2..ed2202fcb19 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartChecksum.cpp @@ -312,18 +312,6 @@ MergeTreeDataPartChecksums::Checksum::uint128 MergeTreeDataPartChecksums::getTot return getSipHash128AsPair(hash_of_all_files); } -String MergeTreeDataPartChecksums::getFileNameOrHash(const String & name) const -{ - if (files.contains(name + ".bin")) - return name; - - auto hash = sipHash128String(name); - if (files.contains(hash + ".bin")) - return hash; - - return name; -} - void MinimalisticDataPartChecksums::serialize(WriteBuffer & to) const { writeString("checksums format version: 5\n", to); diff --git a/src/Storages/MergeTree/MergeTreeDataPartChecksum.h b/src/Storages/MergeTree/MergeTreeDataPartChecksum.h index 2a38b52c72a..8e5e8c8c448 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartChecksum.h +++ b/src/Storages/MergeTree/MergeTreeDataPartChecksum.h @@ -88,11 +88,8 @@ struct MergeTreeDataPartChecksums static MergeTreeDataPartChecksums deserializeFrom(const String & s); UInt64 getTotalSizeOnDisk() const; - - String getFileNameOrHash(const String & name) const; }; - /// A kind of MergeTreeDataPartChecksums intended to be stored in ZooKeeper (to save its RAM) /// MinimalisticDataPartChecksums and MergeTreeDataPartChecksums have the same serialization format /// for versions less than MINIMAL_VERSION_WITH_MINIMALISTIC_CHECKSUMS. 
diff --git a/src/Storages/MergeTree/MergeTreeDataPartCompact.h b/src/Storages/MergeTree/MergeTreeDataPartCompact.h index 2bbac766c8e..7850e7c976c 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartCompact.h +++ b/src/Storages/MergeTree/MergeTreeDataPartCompact.h @@ -57,7 +57,7 @@ public: std::optional getColumnModificationTime(const String & column_name) const override; - String getFileNameForColumn(const NameAndTypePair & /* column */) const override { return DATA_FILE_NAME; } + std::optional getFileNameForColumn(const NameAndTypePair & /* column */) const override { return DATA_FILE_NAME; } ~MergeTreeDataPartCompact() override; diff --git a/src/Storages/MergeTree/MergeTreeDataPartInMemory.h b/src/Storages/MergeTree/MergeTreeDataPartInMemory.h index 95f7b796f9a..c7b7dde50a6 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartInMemory.h +++ b/src/Storages/MergeTree/MergeTreeDataPartInMemory.h @@ -40,7 +40,7 @@ public: bool isStoredOnRemoteDisk() const override { return false; } bool isStoredOnRemoteDiskWithZeroCopySupport() const override { return false; } bool hasColumnFiles(const NameAndTypePair & column) const override { return !!getColumnPosition(column.getNameInStorage()); } - String getFileNameForColumn(const NameAndTypePair & /* column */) const override { return ""; } + std::optional getFileNameForColumn(const NameAndTypePair & /* column */) const override { return ""; } void renameTo(const String & new_relative_path, bool remove_new_dir_if_exists) override; DataPartStoragePtr makeCloneInDetached(const String & prefix, const StorageMetadataPtr & metadata_snapshot, const DiskTransactionPtr & disk_transaction) const override; diff --git a/src/Storages/MergeTree/MergeTreeDataPartWide.cpp b/src/Storages/MergeTree/MergeTreeDataPartWide.cpp index 417b5f3d19b..9b71c8df3a3 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWide.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartWide.cpp @@ -73,20 +73,22 @@ ColumnSize MergeTreeDataPartWide::getColumnSizeImpl( getSerialization(column.name)->enumerateStreams([&](const ISerialization::SubstreamPath & substream_path) { - auto full_stream_name = ISerialization::getFileNameForStream(column, substream_path); - auto stream_name = checksums.getFileNameOrHash(full_stream_name); + auto stream_name = IMergeTreeDataPart::getStreamNameForColumn(column, substream_path, checksums); - if (processed_substreams && !processed_substreams->insert(stream_name).second) + if (!stream_name) return; - auto bin_checksum = checksums.files.find(stream_name + ".bin"); + if (processed_substreams && !processed_substreams->insert(*stream_name).second) + return; + + auto bin_checksum = checksums.files.find(*stream_name + ".bin"); if (bin_checksum != checksums.files.end()) { size.data_compressed += bin_checksum->second.file_size; size.data_uncompressed += bin_checksum->second.uncompressed_size; } - auto mrk_checksum = checksums.files.find(stream_name + getMarksFileExtension()); + auto mrk_checksum = checksums.files.find(*stream_name + getMarksFileExtension()); if (mrk_checksum != checksums.files.end()) size.marks += mrk_checksum->second.file_size; }); @@ -154,7 +156,13 @@ void MergeTreeDataPartWide::loadIndexGranularity() if (columns.empty()) throw Exception(ErrorCodes::NO_FILE_IN_DATA_PART, "No columns in part {}", name); - loadIndexGranularityImpl(index_granularity, index_granularity_info, getDataPartStorage(), getFileNameForColumn(columns.front())); + auto any_column_filename = getFileNameForColumn(columns.front()); + if (!any_column_filename) + throw 
Exception(ErrorCodes::NO_FILE_IN_DATA_PART, + "There are no files for column {} in part {}", + columns.front().name, getDataPartStorage().getFullPath()); + + loadIndexGranularityImpl(index_granularity, index_granularity_info, getDataPartStorage(), *any_column_filename); } @@ -186,23 +194,19 @@ void MergeTreeDataPartWide::checkConsistency(bool require_part_metadata) const { getSerialization(name_type.name)->enumerateStreams([&](const ISerialization::SubstreamPath & substream_path) { - String full_stream_name = ISerialization::getFileNameForStream(name_type, substream_path); - String stream_name = checksums.getFileNameOrHash(full_stream_name); - - String mrk_file_name = stream_name + marks_file_extension; - String bin_file_name = stream_name + DATA_FILE_EXTENSION; + auto stream_name = getStreamNameForColumn(name_type, substream_path, checksums); + if (!stream_name) + throw Exception( + ErrorCodes::NO_FILE_IN_DATA_PART, + "No {}.{} file checksum for column {} in part {}", + *stream_name, DATA_FILE_EXTENSION, name_type.name, getDataPartStorage().getFullPath()); + auto mrk_file_name = *stream_name + marks_file_extension; if (!checksums.files.contains(mrk_file_name)) throw Exception( ErrorCodes::NO_FILE_IN_DATA_PART, "No {} file checksum for column {} in part {} ", mrk_file_name, name_type.name, getDataPartStorage().getFullPath()); - - if (!checksums.files.contains(bin_file_name)) - throw Exception( - ErrorCodes::NO_FILE_IN_DATA_PART, - "No {} file checksum for column {} in part {}", - bin_file_name, name_type.name, getDataPartStorage().getFullPath()); }); } } @@ -215,29 +219,28 @@ void MergeTreeDataPartWide::checkConsistency(bool require_part_metadata) const { getSerialization(name_type.name)->enumerateStreams([&](const ISerialization::SubstreamPath & substream_path) { - auto file_path = ISerialization::getFileNameForStream(name_type, substream_path) + marks_file_extension; - if (!getDataPartStorage().exists(file_path)) - file_path = sipHash128String(file_path) + marks_file_extension; + auto stream_name = getStreamNameForColumn(name_type, substream_path, marks_file_extension, getDataPartStorage()); /// Missing file is Ok for case when new column was added. 
- if (getDataPartStorage().exists(file_path)) - { - UInt64 file_size = getDataPartStorage().getFileSize(file_path); + if (!stream_name) + return; - if (!file_size) - throw Exception( - ErrorCodes::BAD_SIZE_OF_FILE_IN_DATA_PART, - "Part {} is broken: {} is empty.", - getDataPartStorage().getFullPath(), - std::string(fs::path(getDataPartStorage().getFullPath()) / file_path)); + auto file_path = *stream_name + marks_file_extension; + UInt64 file_size = getDataPartStorage().getFileSize(file_path); - if (!marks_size) - marks_size = file_size; - else if (file_size != *marks_size) - throw Exception( - ErrorCodes::BAD_SIZE_OF_FILE_IN_DATA_PART, - "Part {} is broken: marks have different sizes.", getDataPartStorage().getFullPath()); - } + if (!file_size) + throw Exception( + ErrorCodes::BAD_SIZE_OF_FILE_IN_DATA_PART, + "Part {} is broken: {} is empty.", + getDataPartStorage().getFullPath(), + std::string(fs::path(getDataPartStorage().getFullPath()) / file_path)); + + if (!marks_size) + marks_size = file_size; + else if (file_size != *marks_size) + throw Exception( + ErrorCodes::BAD_SIZE_OF_FILE_IN_DATA_PART, + "Part {} is broken: marks have different sizes.", getDataPartStorage().getFullPath()); }); } } @@ -245,22 +248,13 @@ void MergeTreeDataPartWide::checkConsistency(bool require_part_metadata) const bool MergeTreeDataPartWide::hasColumnFiles(const NameAndTypePair & column) const { - std::string marks_file_extension = index_granularity_info.mark_type.getFileExtension(); - auto check_stream_exists = [this, &marks_file_extension](const String & stream_name) - { - auto bin_checksum = checksums.files.find(stream_name + DATA_FILE_EXTENSION); - auto mrk_checksum = checksums.files.find(stream_name + marks_file_extension); - - return bin_checksum != checksums.files.end() && mrk_checksum != checksums.files.end(); - }; + auto marks_file_extension = index_granularity_info.mark_type.getFileExtension(); bool res = true; getSerialization(column.name)->enumerateStreams([&](const auto & substream_path) { - auto full_stream_name = ISerialization::getFileNameForStream(column, substream_path); - auto stream_name = checksums.getFileNameOrHash(full_stream_name); - - if (!check_stream_exists(stream_name)) + auto stream_name = getStreamNameForColumn(column, substream_path, checksums); + if (!stream_name || !checksums.files.contains(*stream_name + marks_file_extension)) res = false; }); @@ -271,8 +265,11 @@ std::optional MergeTreeDataPartWide::getColumnModificationTime(const Str { try { - auto name_on_disk = checksums.getFileNameOrHash(column_name); - return getDataPartStorage().getFileLastModified(name_on_disk + DATA_FILE_EXTENSION).epochTime(); + auto stream_name = getStreamNameOrHash(column_name, checksums); + if (!stream_name) + return {}; + + return getDataPartStorage().getFileLastModified(*stream_name + DATA_FILE_EXTENSION).epochTime(); } catch (const fs::filesystem_error &) { @@ -280,15 +277,18 @@ std::optional MergeTreeDataPartWide::getColumnModificationTime(const Str } } -String MergeTreeDataPartWide::getFileNameForColumn(const NameAndTypePair & column) const +std::optional MergeTreeDataPartWide::getFileNameForColumn(const NameAndTypePair & column) const { - String filename; + std::optional filename; getSerialization(column.name)->enumerateStreams([&](const ISerialization::SubstreamPath & substream_path) { - if (filename.empty()) + if (!filename.has_value()) { - auto full_stream_name = ISerialization::getFileNameForStream(column, substream_path); - filename = checksums.getFileNameOrHash(full_stream_name); + /// 
This method may be called when checksums are not initialized yet. + if (!checksums.empty()) + filename = getStreamNameForColumn(column, substream_path, checksums); + else + filename = getStreamNameForColumn(column, substream_path, DATA_FILE_EXTENSION, getDataPartStorage()); } }); return filename; diff --git a/src/Storages/MergeTree/MergeTreeDataPartWide.h b/src/Storages/MergeTree/MergeTreeDataPartWide.h index 2076a1ec028..bcf70426fa6 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWide.h +++ b/src/Storages/MergeTree/MergeTreeDataPartWide.h @@ -48,7 +48,7 @@ public: bool isStoredOnRemoteDiskWithZeroCopySupport() const override; - String getFileNameForColumn(const NameAndTypePair & column) const override; + std::optional getFileNameForColumn(const NameAndTypePair & column) const override; ~MergeTreeDataPartWide() override; diff --git a/src/Storages/MergeTree/MergeTreeReaderWide.cpp b/src/Storages/MergeTree/MergeTreeReaderWide.cpp index 999e3d0f7ec..4ba6402e3c5 100644 --- a/src/Storages/MergeTree/MergeTreeReaderWide.cpp +++ b/src/Storages/MergeTree/MergeTreeReaderWide.cpp @@ -202,15 +202,6 @@ size_t MergeTreeReaderWide::readRows( return read_rows; } -String getStreamName( - const NameAndTypePair & column, - const ISerialization::SubstreamPath & substream_path, - const MergeTreeDataPartChecksums & checksums) -{ - auto full_stream_name = ISerialization::getFileNameForStream(column, substream_path); - return checksums.getFileNameOrHash(full_stream_name); -} - void MergeTreeReaderWide::addStreams( const NameAndTypePair & name_and_type, const SerializationPtr & serialization, @@ -222,35 +213,33 @@ void MergeTreeReaderWide::addStreams( ISerialization::StreamCallback callback = [&] (const ISerialization::SubstreamPath & substream_path) { - auto stream_name = getStreamName(name_and_type, substream_path, data_part_info_for_read->getChecksums()); - - if (streams.contains(stream_name)) - { - has_any_stream = true; - return; - } - - bool data_file_exists = data_part_info_for_read->getChecksums().files.contains(stream_name + DATA_FILE_EXTENSION); + auto stream_name = IMergeTreeDataPart::getStreamNameForColumn(name_and_type, substream_path, data_part_info_for_read->getChecksums()); /** If data file is missing then we will not try to open it. * It is necessary since it allows to add new column to structure of the table without creating new files for old parts. */ - if (!data_file_exists) + if (!stream_name) { has_all_streams = false; return; } + if (streams.contains(*stream_name)) + { + has_any_stream = true; + return; + } + has_any_stream = true; bool is_lc_dict = substream_path.size() > 1 && substream_path[substream_path.size() - 2].type == ISerialization::Substream::Type::DictionaryKeys; auto context = data_part_info_for_read->getContext(); auto * load_marks_threadpool = settings.read_settings.load_marks_asynchronously ? 
&context->getLoadMarksThreadpool() : nullptr; - streams.emplace(stream_name, std::make_unique( - data_part_info_for_read, stream_name, DATA_FILE_EXTENSION, + streams.emplace(*stream_name, std::make_unique( + data_part_info_for_read, *stream_name, DATA_FILE_EXTENSION, data_part_info_for_read->getMarksCount(), all_mark_ranges, settings, mark_cache, - uncompressed_cache, data_part_info_for_read->getFileSizeOrZero(stream_name + DATA_FILE_EXTENSION), + uncompressed_cache, data_part_info_for_read->getFileSizeOrZero(*stream_name + DATA_FILE_EXTENSION), &data_part_info_for_read->getIndexGranularityInfo(), profile_callback, clock_type, is_lc_dict, load_marks_threadpool)); }; @@ -276,9 +265,11 @@ static ReadBuffer * getStream( if (cache.contains(ISerialization::getSubcolumnNameForStream(substream_path))) return nullptr; - auto stream_name = getStreamName(name_and_type, substream_path, checksums); + auto stream_name = IMergeTreeDataPart::getStreamNameForColumn(name_and_type, substream_path, checksums); + if (!stream_name) + return nullptr; - auto it = streams.find(stream_name); + auto it = streams.find(*stream_name); if (it == streams.end()) return nullptr; @@ -324,15 +315,15 @@ void MergeTreeReaderWide::prefetchForColumn( serialization->enumerateStreams([&](const ISerialization::SubstreamPath & substream_path) { - auto stream_name = getStreamName(name_and_type, substream_path, data_part_info_for_read->getChecksums()); + auto stream_name = IMergeTreeDataPart::getStreamNameForColumn(name_and_type, substream_path, data_part_info_for_read->getChecksums()); - if (!prefetched_streams.contains(stream_name)) + if (stream_name && !prefetched_streams.contains(*stream_name)) { bool seek_to_mark = !continue_reading; if (ReadBuffer * buf = getStream(false, substream_path, data_part_info_for_read->getChecksums(), streams, name_and_type, from_mark, seek_to_mark, current_task_last_mark, cache)) { buf->prefetch(priority); - prefetched_streams.insert(stream_name); + prefetched_streams.insert(*stream_name); } } }); diff --git a/src/Storages/MergeTree/MergeTreeSettings.h b/src/Storages/MergeTree/MergeTreeSettings.h index 38bcb0fc94c..4f02c1c543e 100644 --- a/src/Storages/MergeTree/MergeTreeSettings.h +++ b/src/Storages/MergeTree/MergeTreeSettings.h @@ -35,7 +35,7 @@ struct Settings; M(UInt64, min_rows_for_wide_part, 0, "Minimal number of rows to create part in wide format instead of compact", 0) \ M(Float, ratio_of_defaults_for_sparse_serialization, 0.9375f, "Minimal ratio of number of default values to number of all values in column to store it in sparse serializations. If >= 1, columns will be always written in full serialization.", 0) \ M(Bool, replace_long_file_name_to_hash, false, "If the file name for column is too long (more than 'max_file_name_length' bytes) replace it to SipHash128", 0) \ - M(UInt64, max_file_name_length, 128, "The maximal length of the file name to keep it as is without hashing", 0) \ + M(UInt64, max_file_name_length, 127, "The maximal length of the file name to keep it as is without hashing", 0) \ /** Merge settings. */ \ M(UInt64, merge_max_block_size, 8192, "How many rows in blocks should be formed for merge operations. By default has the same value as `index_granularity`.", 0) \ M(UInt64, merge_max_block_size_bytes, 10 * 1024 * 1024, "How many bytes in blocks should be formed for merge operations. 
By default has the same value as `index_granularity_bytes`.", 0) \ diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index 5ce5355c794..6de23f3e294 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -534,9 +534,9 @@ static std::unordered_map getStreamCounts( { auto callback = [&](const ISerialization::SubstreamPath & substream_path) { - auto full_stream_name = ISerialization::getFileNameForStream(column_name, substream_path); - auto stream_name = source_part_checksums.getFileNameOrHash(full_stream_name); - ++stream_counts[stream_name]; + auto stream_name = IMergeTreeDataPart::getStreamNameForColumn(column_name, substream_path, source_part_checksums); + if (stream_name) + ++stream_counts[*stream_name]; }; serialization->enumerateStreams(callback); @@ -654,14 +654,13 @@ static NameToNameVector collectFilesForRenames( { ISerialization::StreamCallback callback = [&](const ISerialization::SubstreamPath & substream_path) { - auto full_stream_name = ISerialization::getFileNameForStream({command.column_name, command.data_type}, substream_path); - auto stream_name = source_part->checksums.getFileNameOrHash(full_stream_name); + auto stream_name = IMergeTreeDataPart::getStreamNameForColumn(command.column_name, substream_path, source_part->checksums); /// Delete files if they are no longer shared with another column. - if (--stream_counts[stream_name] == 0) + if (stream_name && --stream_counts[*stream_name] == 0) { - add_rename(stream_name + ".bin", ""); - add_rename(stream_name + mrk_extension, ""); + add_rename(*stream_name + ".bin", ""); + add_rename(*stream_name + mrk_extension, ""); } }; @@ -678,13 +677,22 @@ static NameToNameVector collectFilesForRenames( String full_stream_from = ISerialization::getFileNameForStream(command.column_name, substream_path); String full_stream_to = boost::replace_first_copy(full_stream_from, escaped_name_from, escaped_name_to); - String stream_from = source_part->checksums.getFileNameOrHash(full_stream_from); - String stream_to = stream_from == full_stream_from ? 
full_stream_to : sipHash128String(full_stream_to); + auto stream_from = IMergeTreeDataPart::getStreamNameOrHash(full_stream_from, source_part->checksums); + if (!stream_from) + return; + + String stream_to; + auto storage_settings = source_part->storage.getSettings(); + + if (storage_settings->replace_long_file_name_to_hash && full_stream_to.size() > storage_settings->max_file_name_length) + stream_to = sipHash128String(full_stream_to); + else + stream_to = full_stream_to; if (stream_from != stream_to) { - add_rename(stream_from + ".bin", stream_to + ".bin"); - add_rename(stream_from + mrk_extension, stream_to + mrk_extension); + add_rename(*stream_from + ".bin", stream_to + ".bin"); + add_rename(*stream_from + mrk_extension, stream_to + mrk_extension); } }; diff --git a/src/Storages/MergeTree/checkDataPart.cpp b/src/Storages/MergeTree/checkDataPart.cpp index 33715785574..f54056421a7 100644 --- a/src/Storages/MergeTree/checkDataPart.cpp +++ b/src/Storages/MergeTree/checkDataPart.cpp @@ -165,17 +165,14 @@ static IMergeTreeDataPart::Checksums checkDataPart( { get_serialization(column)->enumerateStreams([&](const ISerialization::SubstreamPath & substream_path) { - auto stream_name = ISerialization::getFileNameForStream(column, substream_path); - auto file_name = stream_name + ".bin"; + auto stream_name = IMergeTreeDataPart::getStreamNameForColumn(column, substream_path, ".bin", data_part_storage); - if (!data_part_storage.exists(file_name)) - file_name = sipHash128String(stream_name) + ".bin"; - - if (!data_part_storage.exists(file_name)) + if (!stream_name) throw Exception(ErrorCodes::NO_FILE_IN_DATA_PART, "There is no file for column '{}' in data part '{}'", column.name, data_part->name); + auto file_name = *stream_name + ".bin"; checksums_data.files[file_name] = checksum_compressed_file(data_part_storage, file_name); }); } diff --git a/src/Storages/System/StorageSystemPartsColumns.cpp b/src/Storages/System/StorageSystemPartsColumns.cpp index 0510c733e65..275d56c3da5 100644 --- a/src/Storages/System/StorageSystemPartsColumns.cpp +++ b/src/Storages/System/StorageSystemPartsColumns.cpp @@ -271,19 +271,21 @@ void StorageSystemPartsColumns::processNextStorage( ColumnSize size; NameAndTypePair subcolumn(column.name, name, column.type, data.type); - String full_stream_name = ISerialization::getFileNameForStream(subcolumn, subpath); - String stream_name = part->checksums.getFileNameOrHash(full_stream_name); - auto bin_checksum = part->checksums.files.find(stream_name + ".bin"); - if (bin_checksum != part->checksums.files.end()) + auto stream_name = IMergeTreeDataPart::getStreamNameForColumn(subcolumn, subpath, part->checksums); + if (stream_name) { - size.data_compressed += bin_checksum->second.file_size; - size.data_uncompressed += bin_checksum->second.uncompressed_size; - } + auto bin_checksum = part->checksums.files.find(*stream_name + ".bin"); + if (bin_checksum != part->checksums.files.end()) + { + size.data_compressed += bin_checksum->second.file_size; + size.data_uncompressed += bin_checksum->second.uncompressed_size; + } - auto mrk_checksum = part->checksums.files.find(stream_name + part->index_granularity_info.mark_type.getFileExtension()); - if (mrk_checksum != part->checksums.files.end()) - size.marks += mrk_checksum->second.file_size; + auto mrk_checksum = part->checksums.files.find(*stream_name + part->index_granularity_info.mark_type.getFileExtension()); + if (mrk_checksum != part->checksums.files.end()) + size.marks += mrk_checksum->second.file_size; + } 
subcolumn_bytes_on_disk.push_back(size.data_compressed + size.marks); subcolumn_data_compressed_bytes.push_back(size.data_compressed); From 03f5d3feb4c11ebf7ef8fa4af0dd634dfd3fa41b Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Mon, 28 Aug 2023 14:58:45 +0000 Subject: [PATCH 032/101] fix checkDataPart --- src/Storages/MergeTree/IMergeTreeDataPart.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index 81330255a5f..58fa6e2e66d 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -2114,7 +2114,7 @@ std::optional IMergeTreeDataPart::getStreamNameOrHash( auto hash = sipHash128String(stream_name); if (storage_.exists(hash + extension)) - return stream_name; + return hash; return {}; } From 54755d7e095a0818fa5a8bf234114c2e7e192f80 Mon Sep 17 00:00:00 2001 From: Anton Popov Date: Tue, 29 Aug 2023 12:02:43 +0000 Subject: [PATCH 033/101] fix test --- tests/queries/0_stateless/02253_empty_part_checksums.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02253_empty_part_checksums.sh b/tests/queries/0_stateless/02253_empty_part_checksums.sh index 5d4e750f46d..371c0768e3d 100755 --- a/tests/queries/0_stateless/02253_empty_part_checksums.sh +++ b/tests/queries/0_stateless/02253_empty_part_checksums.sh @@ -10,7 +10,7 @@ $CLICKHOUSE_CLIENT -q "drop table if exists rmt sync;" $CLICKHOUSE_CLIENT -q "CREATE TABLE rmt (a UInt8, b Int16, c Float32, d String, e Array(UInt8), f Nullable(UUID), g Tuple(UInt8, UInt16)) ENGINE = ReplicatedMergeTree('/test/02253/$CLICKHOUSE_TEST_ZOOKEEPER_PREFIX/rmt', '1') ORDER BY a PARTITION BY b % 10 SETTINGS old_parts_lifetime = 1, cleanup_delay_period = 0, cleanup_delay_period_random_add = 0, -cleanup_thread_preferred_points_per_iteration=0, min_bytes_for_wide_part=0, remove_empty_parts=0" +cleanup_thread_preferred_points_per_iteration=0, min_bytes_for_wide_part=0, remove_empty_parts=0, replace_long_file_name_to_hash=0" $CLICKHOUSE_CLIENT --insert_keeper_fault_injection_probability=0 -q "INSERT INTO rmt SELECT rand(1), 0, 1 / rand(3), toString(rand(4)), [rand(5), rand(6)], rand(7) % 2 ? NULL : generateUUIDv4(), (rand(8), rand(9)) FROM numbers(1000);" From 1910434174234ccdf5e30291453eb5ebda687b9b Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Wed, 30 Aug 2023 20:48:26 +0200 Subject: [PATCH 034/101] Remove CurrentStatusInfo --- src/Common/StatusInfo.cpp | 57 -------------------------- src/Common/StatusInfo.h | 39 ------------------ src/Interpreters/ExternalLoader.cpp | 10 ----- src/Server/PrometheusMetricsWriter.cpp | 38 ----------------- src/Server/PrometheusMetricsWriter.h | 2 - 5 files changed, 146 deletions(-) delete mode 100644 src/Common/StatusInfo.cpp delete mode 100644 src/Common/StatusInfo.h diff --git a/src/Common/StatusInfo.cpp b/src/Common/StatusInfo.cpp deleted file mode 100644 index 1f9ddfaf4b9..00000000000 --- a/src/Common/StatusInfo.cpp +++ /dev/null @@ -1,57 +0,0 @@ -#include -#include - -/// Available status. Add something here as you wish. 
-#define APPLY_FOR_STATUS(M) \ - M(DictionaryStatus, "Dictionary Status.", DB::getStatusEnumAllPossibleValues()) \ - - -namespace CurrentStatusInfo -{ - #define M(NAME, DOCUMENTATION, ENUM) extern const Status NAME = Status(__COUNTER__); - APPLY_FOR_STATUS(M) - #undef M - constexpr Status END = Status(__COUNTER__); - - std::mutex locks[END] {}; - std::unordered_map values[END] {}; - - const char * getName(Status event) - { - static const char * strings[] = - { - #define M(NAME, DOCUMENTATION, ENUM) #NAME, - APPLY_FOR_STATUS(M) - #undef M - }; - - return strings[event]; - } - - const char * getDocumentation(Status event) - { - static const char * strings[] = - { - #define M(NAME, DOCUMENTATION, ENUM) #DOCUMENTATION, - APPLY_FOR_STATUS(M) - #undef M - }; - - return strings[event]; - } - - const std::vector> & getAllPossibleValues(Status event) - { - static const std::vector> enum_values [] = - { - #define M(NAME, DOCUMENTATION, ENUM) ENUM, - APPLY_FOR_STATUS(M) - #undef M - }; - return enum_values[event]; - } - - Status end() { return END; } -} - -#undef APPLY_FOR_STATUS diff --git a/src/Common/StatusInfo.h b/src/Common/StatusInfo.h deleted file mode 100644 index 91e6d4d3b85..00000000000 --- a/src/Common/StatusInfo.h +++ /dev/null @@ -1,39 +0,0 @@ -#pragma once - -#include -#include -#include -#include -#include -#include -#include -#include -#include - - -namespace CurrentStatusInfo -{ - using Status = StrongTypedef; - using Key = std::string; - - const char * getName(Status event); - const char * getDocumentation(Status event); - const std::vector> & getAllPossibleValues(Status event); - - extern std::unordered_map values[]; - extern std::mutex locks[]; - - Status end(); - - inline void set(Status status, Key key, Int8 value) - { - std::lock_guard lock(locks[status]); - values[status][key] = value; - } - - inline void unset(Status status, Key key) - { - std::lock_guard lock(locks[status]); - values[status].erase(key); - } -} diff --git a/src/Interpreters/ExternalLoader.cpp b/src/Interpreters/ExternalLoader.cpp index 5dee750889c..56d480d8735 100644 --- a/src/Interpreters/ExternalLoader.cpp +++ b/src/Interpreters/ExternalLoader.cpp @@ -1,7 +1,6 @@ #include "ExternalLoader.h" #include -#include #include #include #include @@ -9,7 +8,6 @@ #include #include #include -#include #include #include #include @@ -18,12 +16,6 @@ #include -namespace CurrentStatusInfo -{ - extern const Status DictionaryStatus; -} - - namespace DB { namespace ErrorCodes @@ -1145,7 +1137,6 @@ private: if (info && (info->loading_id == loading_id)) { info->loading_id = info->state_id; - CurrentStatusInfo::set(CurrentStatusInfo::DictionaryStatus, name, static_cast(info->status())); } min_id_to_finish_loading_dependencies.erase(std::this_thread::get_id()); @@ -1307,7 +1298,6 @@ scope_guard ExternalLoader::addConfigRepository(std::unique_ptrremoveConfigRepository(ptr); - CurrentStatusInfo::unset(CurrentStatusInfo::DictionaryStatus, name); reloadConfig(name); }; } diff --git a/src/Server/PrometheusMetricsWriter.cpp b/src/Server/PrometheusMetricsWriter.cpp index 2331e455225..a7d90b9985c 100644 --- a/src/Server/PrometheusMetricsWriter.cpp +++ b/src/Server/PrometheusMetricsWriter.cpp @@ -1,7 +1,6 @@ #include "PrometheusMetricsWriter.h" #include -#include #include /// TODO: this library is harmful. 
#include @@ -51,7 +50,6 @@ PrometheusMetricsWriter::PrometheusMetricsWriter( , send_events(config.getBool(config_name + ".events", true)) , send_metrics(config.getBool(config_name + ".metrics", true)) , send_asynchronous_metrics(config.getBool(config_name + ".asynchronous_metrics", true)) - , send_status_info(config.getBool(config_name + ".status_info", true)) { } @@ -120,42 +118,6 @@ void PrometheusMetricsWriter::write(WriteBuffer & wb) const writeOutLine(wb, key, value.value); } } - - if (send_status_info) - { - for (size_t i = 0, end = CurrentStatusInfo::end(); i < end; ++i) - { - std::lock_guard lock(CurrentStatusInfo::locks[static_cast(i)]); - std::string metric_name{CurrentStatusInfo::getName(static_cast(i))}; - std::string metric_doc{CurrentStatusInfo::getDocumentation(static_cast(i))}; - - convertHelpToSingleLine(metric_doc); - - if (!replaceInvalidChars(metric_name)) - continue; - std::string key{current_status_prefix + metric_name}; - - writeOutLine(wb, "# HELP", key, metric_doc); - writeOutLine(wb, "# TYPE", key, "gauge"); - - for (const auto & value: CurrentStatusInfo::values[i]) - { - for (const auto & enum_value: CurrentStatusInfo::getAllPossibleValues(static_cast(i))) - { - DB::writeText(key, wb); - DB::writeChar('{', wb); - DB::writeText(key, wb); - DB::writeChar('=', wb); - writeDoubleQuotedString(enum_value.first, wb); - DB::writeText(",name=", wb); - writeDoubleQuotedString(value.first, wb); - DB::writeText("} ", wb); - DB::writeText(value.second == enum_value.second, wb); - DB::writeChar('\n', wb); - } - } - } - } } } diff --git a/src/Server/PrometheusMetricsWriter.h b/src/Server/PrometheusMetricsWriter.h index b4f6ab57def..b05eeaf0a3a 100644 --- a/src/Server/PrometheusMetricsWriter.h +++ b/src/Server/PrometheusMetricsWriter.h @@ -27,12 +27,10 @@ private: const bool send_events; const bool send_metrics; const bool send_asynchronous_metrics; - const bool send_status_info; static inline constexpr auto profile_events_prefix = "ClickHouseProfileEvents_"; static inline constexpr auto current_metrics_prefix = "ClickHouseMetrics_"; static inline constexpr auto asynchronous_metrics_prefix = "ClickHouseAsyncMetrics_"; - static inline constexpr auto current_status_prefix = "ClickHouseStatusInfo_"; }; } From 9d6dc1067f172187a739e0939e23acad0e631dc1 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Wed, 30 Aug 2023 20:49:02 +0200 Subject: [PATCH 035/101] Remove CurrentStatusInfo --- ...HouseStatusInfo_DictionaryStatus.reference | 18 --------- ...s_ClickHouseStatusInfo_DictionaryStatus.sh | 38 ------------------- 2 files changed, 56 deletions(-) delete mode 100644 tests/queries/0_stateless/02390_prometheus_ClickHouseStatusInfo_DictionaryStatus.reference delete mode 100755 tests/queries/0_stateless/02390_prometheus_ClickHouseStatusInfo_DictionaryStatus.sh diff --git a/tests/queries/0_stateless/02390_prometheus_ClickHouseStatusInfo_DictionaryStatus.reference b/tests/queries/0_stateless/02390_prometheus_ClickHouseStatusInfo_DictionaryStatus.reference deleted file mode 100644 index 50c91c3fa0c..00000000000 --- a/tests/queries/0_stateless/02390_prometheus_ClickHouseStatusInfo_DictionaryStatus.reference +++ /dev/null @@ -1,18 +0,0 @@ -status before reload -status after reload -NOT_LOADED 0 -LOADED 0 -FAILED 1 -LOADING 0 -FAILED_AND_RELOADING 0 -LOADED_AND_RELOADING 0 -NOT_EXIST 0 -status after reload, table exists -NOT_LOADED 0 -LOADED 1 -FAILED 0 -LOADING 0 -FAILED_AND_RELOADING 0 -LOADED_AND_RELOADING 0 -NOT_EXIST 0 -status after drop diff --git 
a/tests/queries/0_stateless/02390_prometheus_ClickHouseStatusInfo_DictionaryStatus.sh b/tests/queries/0_stateless/02390_prometheus_ClickHouseStatusInfo_DictionaryStatus.sh deleted file mode 100755 index 65025858e20..00000000000 --- a/tests/queries/0_stateless/02390_prometheus_ClickHouseStatusInfo_DictionaryStatus.sh +++ /dev/null @@ -1,38 +0,0 @@ -#!/usr/bin/env bash -# Tags: no-ordinary-database - -CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) -# shellcheck source=../shell_config.sh -. "$CUR_DIR"/../shell_config.sh - -function get_dictionary_status() -{ - local name=$1 && shift - $CLICKHOUSE_CURL -sS "$CLICKHOUSE_URL_PROMETHEUS" | { - awk -F'[{}=," ]' -vname="$name" '/ClickHouseStatusInfo_DictionaryStatus{/ && $(NF-3) == name { print $4, $NF }' - } -} - -$CLICKHOUSE_CLIENT -q "CREATE DICTIONARY dict (key Int, value String) PRIMARY KEY key SOURCE(CLICKHOUSE(TABLE data)) LAYOUT(HASHED()) LIFETIME(0)" -uuid="$($CLICKHOUSE_CLIENT -q "SELECT uuid FROM system.dictionaries WHERE database = '$CLICKHOUSE_DATABASE' AND name = 'dict'")" - -echo 'status before reload' -get_dictionary_status "$uuid" - -# source table does not exists -# NOTE: when dictionary does not exist it produce BAD_ARGUMENTS error, so using UNKNOWN_TABLE is safe -$CLICKHOUSE_CLIENT -n -q "SYSTEM RELOAD DICTIONARY dict -- { serverError UNKNOWN_TABLE }" -echo 'status after reload' -get_dictionary_status "$uuid" - -# create source -$CLICKHOUSE_CLIENT -q "CREATE TABLE data (key Int, value String) Engine=Null" -$CLICKHOUSE_CLIENT -q "SYSTEM RELOAD DICTIONARY dict" -echo 'status after reload, table exists' -get_dictionary_status "$uuid" - -# remove dictionary -$CLICKHOUSE_CLIENT -q "DROP DICTIONARY dict" -$CLICKHOUSE_CLIENT -q "DROP TABLE data" -echo 'status after drop' -get_dictionary_status "$uuid" From bb47e2cc234baab26d018f081cb257ff1d0b9cf0 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Wed, 30 Aug 2023 20:56:14 +0200 Subject: [PATCH 036/101] Remove CurrentStatusInfo --- .../testdata/configs/xml/config.xml | 21 ------------------- .../testdata/configs/yandex_xml/config.xml | 21 ------------------- programs/server/config.xml | 2 -- .../test_config_xml_full/configs/config.xml | 21 ------------------- 4 files changed, 65 deletions(-) diff --git a/programs/diagnostics/testdata/configs/xml/config.xml b/programs/diagnostics/testdata/configs/xml/config.xml index c08b0b2970f..50352ca800e 100644 --- a/programs/diagnostics/testdata/configs/xml/config.xml +++ b/programs/diagnostics/testdata/configs/xml/config.xml @@ -760,27 +760,6 @@ --> - - - - - - - - diff --git a/tests/integration/test_config_xml_full/configs/config.xml b/tests/integration/test_config_xml_full/configs/config.xml index d142df18af8..ac59b3428e8 100644 --- a/tests/integration/test_config_xml_full/configs/config.xml +++ b/tests/integration/test_config_xml_full/configs/config.xml @@ -674,27 +674,6 @@ --> - - - -