From 82a849ba8e1b95833d2ae7f3bcdd3e1c008bacb5 Mon Sep 17 00:00:00 2001
From: Artur <613623@mail.ru>
Date: Sat, 18 Sep 2021 09:36:02 +0000
Subject: [PATCH 001/104] add options method
---
programs/server/config.xml | 19 ++++++++++++++++++
src/Interpreters/ClientInfo.h | 5 +++--
src/Server/HTTPHandler.cpp | 37 +++++++++++++++++++++++++++++++++++
3 files changed, 59 insertions(+), 2 deletions(-)
diff --git a/programs/server/config.xml b/programs/server/config.xml
index 6c98ac740fe..bec51de6126 100644
--- a/programs/server/config.xml
+++ b/programs/server/config.xml
@@ -62,6 +62,25 @@
-->
+
+
+ Access-Control-Allow-Origin
+ *
+
+
+ Access-Control-Allow-Headers
+ origin, x-requested-with
+
+
+ Access-Control-Allow-Methods
+ POST, GET, OPTIONS
+
+
+ Access-Control-Max-Age
+ 86400
+
+
+
diff --git a/src/Interpreters/ClientInfo.h b/src/Interpreters/ClientInfo.h
index 71570778645..294bf3b426c 100644
--- a/src/Interpreters/ClientInfo.h
+++ b/src/Interpreters/ClientInfo.h
@@ -35,8 +35,9 @@ public:
enum class HTTPMethod : uint8_t
{
UNKNOWN = 0,
- GET = 1,
- POST = 2,
+ GET = 1,
+ POST = 2,
+ OPTIONS = 3
};
enum class QueryKind : uint8_t
diff --git a/src/Server/HTTPHandler.cpp b/src/Server/HTTPHandler.cpp
index 0492b58dc88..99502261aa9 100644
--- a/src/Server/HTTPHandler.cpp
+++ b/src/Server/HTTPHandler.cpp
@@ -32,6 +32,7 @@
#include
#include
#include
+#include "Server/HTTP/HTTPResponse.h"
#if !defined(ARCADIA_BUILD)
# include
@@ -108,6 +109,37 @@ namespace ErrorCodes
extern const int HTTP_LENGTH_REQUIRED;
}
+namespace
+{
+ /// Process options request. Usefull for CORS.
+ void processOptionsRequest(HTTPServerResponse & response, const Poco::Util::LayeredConfiguration & config)
+ {
+ /// If answer for options request was not defined, return 501 to client.
+ if (!config.has("http_options_response"))
+ {
+ response.setStatusAndReason(HTTPResponse::HTTP_NOT_IMPLEMENTED);
+ response.send();
+ }
+ else
+ {
+ /// otherwise fill response.
+ Strings config_keys;
+ config.keys("http_options_response", config_keys);
+ for (const std::string & config_key : config_keys)
+ {
+ if (config_key == "header" || config_key.starts_with("header["))
+ {
+ response.add(config.getString("http_options_response." + config_key + ".name", "Empty header"),
+ config.getString("http_options_response." + config_key + ".value", ""));
+ response.setKeepAlive(false);
+ }
+ }
+ response.setStatusAndReason(HTTPResponse::HTTP_NO_CONTENT);
+ response.send();
+ }
+ }
+}
+
static String base64Decode(const String & encoded)
{
String decoded;
@@ -850,6 +882,11 @@ void HTTPHandler::handleRequest(HTTPServerRequest & request, HTTPServerResponse
try
{
+ if (request.getMethod() == HTTPServerRequest::HTTP_OPTIONS)
+ {
+ processOptionsRequest(response, server.config());
+ return;
+ }
response.setContentType("text/plain; charset=UTF-8");
response.set("X-ClickHouse-Server-Display-Name", server_display_name);
/// For keep-alive to work.
From c8892ec7a71eac73a852ab1b8d200a86148b08c5 Mon Sep 17 00:00:00 2001
From: Artur <613623@mail.ru>
Date: Wed, 22 Sep 2021 10:34:48 +0000
Subject: [PATCH 002/104] add options support
---
src/Server/HTTPHandler.cpp | 19 +++++++++++++------
src/Server/HTTPHandlerFactory.cpp | 4 ++--
src/Server/HTTPHandlerFactory.h | 6 ++++--
3 files changed, 19 insertions(+), 10 deletions(-)
diff --git a/src/Server/HTTPHandler.cpp b/src/Server/HTTPHandler.cpp
index 99502261aa9..017bc82a475 100644
--- a/src/Server/HTTPHandler.cpp
+++ b/src/Server/HTTPHandler.cpp
@@ -25,6 +25,7 @@
#include
#include
#include
+#include "common/logger_useful.h"
#include
#include
#include
@@ -111,10 +112,11 @@ namespace ErrorCodes
namespace
{
- /// Process options request. Usefull for CORS.
+ /// Process options request. Useful for CORS.
void processOptionsRequest(HTTPServerResponse & response, const Poco::Util::LayeredConfiguration & config)
{
- /// If answer for options request was not defined, return 501 to client.
+ /// If response for options request was not defined, return 501 to client.
+ /// TODO should it be here?
if (!config.has("http_options_response"))
{
response.setStatusAndReason(HTTPResponse::HTTP_NOT_IMPLEMENTED);
@@ -129,12 +131,17 @@ namespace
{
if (config_key == "header" || config_key.starts_with("header["))
{
- response.add(config.getString("http_options_response." + config_key + ".name", "Empty header"),
- config.getString("http_options_response." + config_key + ".value", ""));
- response.setKeepAlive(false);
+ /// If there is empty header name, it will not be processed and message about it will be in logs
+ if (config.getString("http_options_response." + config_key + ".name", "").empty())
+ LOG_WARNING(&Poco::Logger::get("processOptionsRequest"), "Empty header was found in config. It will not be processed.");
+ else
+ response.add(config.getString("http_options_response." + config_key + ".name", ""),
+ config.getString("http_options_response." + config_key + ".value", ""));
+
}
}
- response.setStatusAndReason(HTTPResponse::HTTP_NO_CONTENT);
+ response.setKeepAlive(false);
+ response.setStatusAndReason(HTTPResponse::HTTP_OK);
response.send();
}
}
diff --git a/src/Server/HTTPHandlerFactory.cpp b/src/Server/HTTPHandlerFactory.cpp
index 1e3d02b85ab..526b86a5c28 100644
--- a/src/Server/HTTPHandlerFactory.cpp
+++ b/src/Server/HTTPHandlerFactory.cpp
@@ -123,7 +123,7 @@ static inline HTTPRequestHandlerFactoryPtr createInterserverHTTPHandlerFactory(I
addCommonDefaultHandlersFactory(*factory, server);
auto main_handler = std::make_shared>(server);
- main_handler->allowPostAndGetParamsRequest();
+ main_handler->allowPostAndGetParamsAndOptionsRequest();
factory->addHandler(main_handler);
return factory;
@@ -180,7 +180,7 @@ void addDefaultHandlersFactory(HTTPRequestHandlerFactoryMain & factory, IServer
addCommonDefaultHandlersFactory(factory, server);
auto query_handler = std::make_shared>(server, "query");
- query_handler->allowPostAndGetParamsRequest();
+ query_handler->allowPostAndGetParamsAndOptionsRequest();
factory.addHandler(query_handler);
/// We check that prometheus handler will be served on current (default) port.
diff --git a/src/Server/HTTPHandlerFactory.h b/src/Server/HTTPHandlerFactory.h
index 6297f988eaa..5497d585d43 100644
--- a/src/Server/HTTPHandlerFactory.h
+++ b/src/Server/HTTPHandlerFactory.h
@@ -104,11 +104,13 @@ public:
}
/// Handle POST or GET with params
- void allowPostAndGetParamsRequest()
+ void allowPostAndGetParamsAndOptionsRequest()
{
addFilter([](const auto & request)
{
- return request.getURI().find('?') != std::string::npos
+ return (request.getURI().find('?') != std::string::npos
+ && request.getMethod() == Poco::Net::HTTPRequest::HTTP_GET)
+ || request.getMethod() == Poco::Net::HTTPRequest::HTTP_OPTIONS
|| request.getMethod() == Poco::Net::HTTPRequest::HTTP_POST;
});
}
From 2cffa98a60677517a372f72a1fea746a19bb0328 Mon Sep 17 00:00:00 2001
From: Artur <613623@mail.ru>
Date: Wed, 22 Sep 2021 12:22:21 +0000
Subject: [PATCH 003/104] add test and comments in config
---
programs/server/config.xml | 6 ++++--
src/Server/HTTPHandler.cpp | 14 ++++---------
tests/config/config.d/CORS.xml | 20 +++++++++++++++++++
.../02029_test_options_requests.reference | 5 +++++
.../02029_test_options_requests.sh | 8 ++++++++
5 files changed, 41 insertions(+), 12 deletions(-)
create mode 100644 tests/config/config.d/CORS.xml
create mode 100644 tests/queries/0_stateless/02029_test_options_requests.reference
create mode 100755 tests/queries/0_stateless/02029_test_options_requests.sh
diff --git a/programs/server/config.xml b/programs/server/config.xml
index bec51de6126..26c3107e972 100644
--- a/programs/server/config.xml
+++ b/programs/server/config.xml
@@ -62,7 +62,9 @@
-->
-
+
+
+
random
+
+
+ 1
diff --git a/src/Server/HTTP/WriteBufferFromHTTPServerResponse.cpp b/src/Server/HTTP/WriteBufferFromHTTPServerResponse.cpp
index a4fe3649e6f..5bc10841726 100644
--- a/src/Server/HTTP/WriteBufferFromHTTPServerResponse.cpp
+++ b/src/Server/HTTP/WriteBufferFromHTTPServerResponse.cpp
@@ -29,9 +29,6 @@ void WriteBufferFromHTTPServerResponse::startSendHeaders()
{
headers_started_sending = true;
- if (add_cors_header)
- response.set("Access-Control-Allow-Origin", "*");
-
setResponseDefaultHeaders(response, keep_alive_timeout);
if (!is_http_method_head)
diff --git a/src/Server/HTTP/WriteBufferFromHTTPServerResponse.h b/src/Server/HTTP/WriteBufferFromHTTPServerResponse.h
index b4ff454195f..7cebf5ca770 100644
--- a/src/Server/HTTP/WriteBufferFromHTTPServerResponse.h
+++ b/src/Server/HTTP/WriteBufferFromHTTPServerResponse.h
@@ -36,7 +36,6 @@ private:
HTTPServerResponse & response;
bool is_http_method_head;
- bool add_cors_header = false;
unsigned keep_alive_timeout = 0;
bool compress = false;
CompressionMethod compression_method;
@@ -103,13 +102,6 @@ public:
compression_level = level;
}
- /// Turn CORS on or off.
- /// The setting has any effect only if HTTP headers haven't been sent yet.
- void addHeaderCORS(bool enable_cors)
- {
- add_cors_header = enable_cors;
- }
-
/// Don't send HTTP headers with progress more frequently.
void setSendProgressInterval(size_t send_progress_interval_ms_)
{
diff --git a/src/Server/HTTPHandler.cpp b/src/Server/HTTPHandler.cpp
index cec7e1c8b3d..c27d5343e90 100644
--- a/src/Server/HTTPHandler.cpp
+++ b/src/Server/HTTPHandler.cpp
@@ -33,7 +33,7 @@
#include
#include
#include
-#include "Server/HTTP/HTTPResponse.h"
+#include
#if !defined(ARCADIA_BUILD)
# include
@@ -112,33 +112,41 @@ namespace ErrorCodes
namespace
{
- /// Process options request. Useful for CORS.
- void processOptionsRequest(HTTPServerResponse & response, const Poco::Util::LayeredConfiguration & config)
+bool tryAddHeadersFromConfig(HTTPServerResponse & response, const Poco::Util::LayeredConfiguration & config)
+{
+ if (config.has("http_options_response"))
{
- /// If there is information for options request in cofing, fill response.
- /// For this purpose find all headers related to http_options_response and add them with their values to response
- if (config.has("http_options_response"))
+ Strings config_keys;
+ config.keys("http_options_response", config_keys);
+ for (const std::string & config_key : config_keys)
{
- Strings config_keys;
- config.keys("http_options_response", config_keys);
- for (const std::string & config_key : config_keys)
+ if (config_key == "header" || config_key.starts_with("header["))
{
- if (config_key == "header" || config_key.starts_with("header["))
- {
- /// If there is empty header name, it will not be processed and message about it will be in logs
- if (config.getString("http_options_response." + config_key + ".name", "").empty())
- LOG_WARNING(&Poco::Logger::get("processOptionsRequest"), "Empty header was found in config. It will not be processed.");
- else
- response.add(config.getString("http_options_response." + config_key + ".name", ""),
- config.getString("http_options_response." + config_key + ".value", ""));
+ /// If there is empty header name, it will not be processed and message about it will be in logs
+ if (config.getString("http_options_response." + config_key + ".name", "").empty())
+ LOG_WARNING(&Poco::Logger::get("processOptionsRequest"), "Empty header was found in config. It will not be processed.");
+ else
+ response.add(config.getString("http_options_response." + config_key + ".name", ""),
+ config.getString("http_options_response." + config_key + ".value", ""));
- }
}
- response.setKeepAlive(false);
- response.setStatusAndReason(HTTPResponse::HTTP_NO_CONTENT);
- response.send();
}
+ return true;
}
+ return false;
+}
+
+/// Process options request. Useful for CORS.
+void processOptionsRequest(HTTPServerResponse & response, const Poco::Util::LayeredConfiguration & config)
+{
+    /// If at least one header could be added from the config, complete and send the response.
+ if (tryAddHeadersFromConfig(response, config))
+ {
+ response.setKeepAlive(false);
+ response.setStatusAndReason(HTTPResponse::HTTP_NO_CONTENT);
+ response.send();
+ }
+}
}
static String base64Decode(const String & encoded)
@@ -739,9 +747,10 @@ void HTTPHandler::processQuery(
if (in_post_compressed && settings.http_native_compression_disable_checksumming_on_decompress)
static_cast(*in_post_maybe_compressed).disableChecksumming();
- /// Add CORS header if 'add_http_cors_header' setting is turned on and the client passed
- /// Origin header.
- used_output.out->addHeaderCORS(settings.add_http_cors_header && !request.get("Origin", "").empty());
+ /// Add CORS header if 'add_http_cors_header' setting is turned on or config has http_options_response,
+ /// which means that there are some headers to be sent, and the client passed Origin header.
+ if ((settings.add_http_cors_header || config.has("http_options_response")) && !request.get("Origin", "").empty())
+ tryAddHeadersFromConfig(response, config);
auto append_callback = [context] (ProgressCallback callback)
{
From ce4193fe957367d28da59e6c94fc54aefb3038db Mon Sep 17 00:00:00 2001
From: Artur <613623@mail.ru>
Date: Wed, 22 Sep 2021 17:10:15 +0000
Subject: [PATCH 007/104] small refactoring
---
src/Server/HTTPHandler.cpp | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/src/Server/HTTPHandler.cpp b/src/Server/HTTPHandler.cpp
index c27d5343e90..046e7bdfaad 100644
--- a/src/Server/HTTPHandler.cpp
+++ b/src/Server/HTTPHandler.cpp
@@ -749,7 +749,7 @@ void HTTPHandler::processQuery(
/// Add CORS header if 'add_http_cors_header' setting is turned on or config has http_options_response,
/// which means that there are some headers to be sent, and the client passed Origin header.
- if ((settings.add_http_cors_header || config.has("http_options_response")) && !request.get("Origin", "").empty())
+ if (settings.add_http_cors_header && config.has("http_options_response") && !request.get("Origin", "").empty())
tryAddHeadersFromConfig(response, config);
auto append_callback = [context] (ProgressCallback callback)
From 7bbd08cb5d4c90357fc23b0cbfe96f36cfecff33 Mon Sep 17 00:00:00 2001
From: Filatenkov Artur <58165623+FArthur-cmd@users.noreply.github.com>
Date: Fri, 24 Sep 2021 15:40:27 +0300
Subject: [PATCH 008/104] Update HTTPHandler.cpp
---
src/Server/HTTPHandler.cpp | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/src/Server/HTTPHandler.cpp b/src/Server/HTTPHandler.cpp
index bd4452ac6cb..7357c56ad2e 100644
--- a/src/Server/HTTPHandler.cpp
+++ b/src/Server/HTTPHandler.cpp
@@ -125,7 +125,7 @@ bool tryAddHeadersFromConfig(HTTPServerResponse & response, const Poco::Util::La
/// If there is empty header name, it will not be processed and message about it will be in logs
if (config.getString("http_options_response." + config_key + ".name", "").empty())
LOG_WARNING(&Poco::Logger::get("processOptionsRequest"), "Empty header was found in config. It will not be processed.");
- else
+ else
response.add(config.getString("http_options_response." + config_key + ".name", ""),
config.getString("http_options_response." + config_key + ".value", ""));
From fcebf7b9853452caaffc39d91a31d19ae55a45ba Mon Sep 17 00:00:00 2001
From: Artur <613623@mail.ru>
Date: Wed, 29 Sep 2021 11:29:24 +0000
Subject: [PATCH 009/104] correct tests
---
src/Server/HTTPHandlerFactory.h | 3 +--
1 file changed, 1 insertion(+), 2 deletions(-)
diff --git a/src/Server/HTTPHandlerFactory.h b/src/Server/HTTPHandlerFactory.h
index e81955ef2b2..f6d96189d92 100644
--- a/src/Server/HTTPHandlerFactory.h
+++ b/src/Server/HTTPHandlerFactory.h
@@ -108,8 +108,7 @@ public:
{
addFilter([](const auto & request)
{
- return (request.getURI().find('?') != std::string::npos
- && request.getMethod() == Poco::Net::HTTPRequest::HTTP_GET)
+ return request.getURI().find('?') != std::string::npos
|| request.getMethod() == Poco::Net::HTTPRequest::HTTP_OPTIONS
|| request.getMethod() == Poco::Net::HTTPRequest::HTTP_POST;
});
From 36b699659e466c1deaf4737f973adcfc95fe378b Mon Sep 17 00:00:00 2001
From: Filatenkov Artur <58165623+FArthur-cmd@users.noreply.github.com>
Date: Wed, 29 Sep 2021 14:32:04 +0300
Subject: [PATCH 010/104] Update CORS.xml
---
tests/config/config.d/CORS.xml | 4 ++--
1 file changed, 2 insertions(+), 2 deletions(-)
diff --git a/tests/config/config.d/CORS.xml b/tests/config/config.d/CORS.xml
index 9dd7d402416..873821478dc 100644
--- a/tests/config/config.d/CORS.xml
+++ b/tests/config/config.d/CORS.xml
@@ -1,4 +1,4 @@
-
+
Access-Control-Allow-Origin
@@ -17,5 +17,5 @@
86400
-
+
From cac28833d247617804627e3059589da17c09de1d Mon Sep 17 00:00:00 2001
From: Artur Filatenkov <613623@mail.ru>
Date: Wed, 29 Sep 2021 18:54:04 +0300
Subject: [PATCH 011/104] apply added config in tests
---
tests/config/install.sh | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/tests/config/install.sh b/tests/config/install.sh
index df62cba0ea9..936c44a4e7b 100755
--- a/tests/config/install.sh
+++ b/tests/config/install.sh
@@ -37,6 +37,7 @@ ln -sf $SRC_PATH/config.d/tcp_with_proxy.xml $DEST_SERVER_PATH/config.d/
ln -sf $SRC_PATH/config.d/top_level_domains_lists.xml $DEST_SERVER_PATH/config.d/
ln -sf $SRC_PATH/config.d/top_level_domains_path.xml $DEST_SERVER_PATH/config.d/
ln -sf $SRC_PATH/config.d/encryption.xml $DEST_SERVER_PATH/config.d/
+ln -sf $SRC_PATH/config.d/CORS.xml $DEST_SERVER_PATH/config.d/
ln -sf $SRC_PATH/config.d/zookeeper_log.xml $DEST_SERVER_PATH/config.d/
ln -sf $SRC_PATH/config.d/logger.xml $DEST_SERVER_PATH/config.d/
ln -sf $SRC_PATH/users.d/log_queries.xml $DEST_SERVER_PATH/users.d/
@@ -57,7 +58,6 @@ ln -sf $SRC_PATH/strings_dictionary.xml $DEST_SERVER_PATH/
ln -sf $SRC_PATH/decimals_dictionary.xml $DEST_SERVER_PATH/
ln -sf $SRC_PATH/executable_dictionary.xml $DEST_SERVER_PATH/
ln -sf $SRC_PATH/executable_pool_dictionary.xml $DEST_SERVER_PATH/
-ln -sf $SRC_PATH/test_function.xml $DEST_SERVER_PATH/
ln -sf $SRC_PATH/top_level_domains $DEST_SERVER_PATH/
From 68f8b9d235e7417537e4066fb864a71dd8149fd0 Mon Sep 17 00:00:00 2001
From: Nikolai Kochetov
Date: Wed, 29 Sep 2021 20:45:01 +0300
Subject: [PATCH 012/104] Update ColumnGathererStream
---
src/DataStreams/ColumnGathererStream.cpp | 164 ++++++++++++------
src/DataStreams/ColumnGathererStream.h | 98 ++++++-----
.../MergeTree/IMergedBlockOutputStream.h | 4 +-
src/Storages/MergeTree/MergeTask.cpp | 5 -
.../MergeTree/MergedBlockOutputStream.cpp | 5 -
.../MergeTree/MergedBlockOutputStream.h | 7 +-
.../MergedColumnOnlyOutputStream.cpp | 5 -
.../MergeTree/MergedColumnOnlyOutputStream.h | 5 +-
8 files changed, 168 insertions(+), 125 deletions(-)
diff --git a/src/DataStreams/ColumnGathererStream.cpp b/src/DataStreams/ColumnGathererStream.cpp
index 683b8012efe..90da7792c21 100644
--- a/src/DataStreams/ColumnGathererStream.cpp
+++ b/src/DataStreams/ColumnGathererStream.cpp
@@ -18,97 +18,151 @@ namespace ErrorCodes
}
ColumnGathererStream::ColumnGathererStream(
- const String & column_name_, const BlockInputStreams & source_streams, ReadBuffer & row_sources_buf_,
- size_t block_preferred_size_)
- : column_name(column_name_), sources(source_streams.size()), row_sources_buf(row_sources_buf_)
- , block_preferred_size(block_preferred_size_), log(&Poco::Logger::get("ColumnGathererStream"))
+ size_t num_inputs, ReadBuffer & row_sources_buf_, size_t block_preferred_size_)
+ : sources(num_inputs), row_sources_buf(row_sources_buf_)
+ , block_preferred_size(block_preferred_size_)
{
- if (source_streams.empty())
+ if (num_inputs == 0)
throw Exception("There are no streams to gather", ErrorCodes::EMPTY_DATA_PASSED);
+}
- children.assign(source_streams.begin(), source_streams.end());
-
- for (size_t i = 0; i < children.size(); ++i)
+void ColumnGathererStream::initialize(Inputs inputs)
+{
+ for (size_t i = 0; i < inputs.size(); ++i)
{
- const Block & header = children[i]->getHeader();
-
- /// Sometimes MergeTreeReader injects additional column with partitioning key
- if (header.columns() > 2)
- throw Exception(
- "Block should have 1 or 2 columns, but contains " + toString(header.columns()),
- ErrorCodes::INCORRECT_NUMBER_OF_COLUMNS);
-
- if (i == 0)
+ if (inputs[i].chunk)
{
- column.name = column_name;
- column.type = header.getByName(column_name).type;
- column.column = column.type->createColumn();
+ sources[i].update(inputs[i].chunk.detachColumns().at(0));
+ if (!result_column)
+ result_column = sources[i].column->cloneEmpty();
}
- else if (header.getByName(column_name).column->getName() != column.column->getName())
- throw Exception("Column types don't match", ErrorCodes::INCOMPATIBLE_COLUMNS);
}
}
-
-Block ColumnGathererStream::readImpl()
+IMergingAlgorithm::Status ColumnGathererStream::merge()
{
+ /// Nothing to read after initialize.
+ if (!result_column)
+ return Status(Chunk(), true);
+
+ if (source_to_fully_copy) /// Was set on a previous iteration
+ {
+ Chunk res;
+ res.addColumn(source_to_fully_copy->column);
+ merged_rows += source_to_fully_copy->size;
+ source_to_fully_copy->pos = source_to_fully_copy->size;
+ source_to_fully_copy = nullptr;
+ return Status(std::move(res));
+ }
+
/// Special case: single source and there are no skipped rows
- if (children.size() == 1 && row_sources_buf.eof() && !source_to_fully_copy)
- return children[0]->read();
+ /// Note: looks like this should never happen because row_sources_buf cannot just skip row info.
+ if (sources.size() == 1 && row_sources_buf.eof())
+ {
+ if (sources.front().pos < sources.front().size)
+ {
+ next_required_source = 0;
+ Chunk res;
+ merged_rows += sources.front().column->size();
+ merged_bytes += sources.front().column->allocatedBytes();
+ res.addColumn(std::move(sources.front().column));
+ sources.front().pos = sources.front().size = 0;
+ return Status(std::move(res));
+ }
- if (!source_to_fully_copy && row_sources_buf.eof())
- return Block();
+ if (next_required_source == -1)
+ return Status(Chunk(), true);
- MutableColumnPtr output_column = column.column->cloneEmpty();
- output_block = Block{column.cloneEmpty()};
- /// Surprisingly this call may directly change output_block, bypassing
+ next_required_source = 0;
+ return Status(next_required_source);
+ }
+
+ if (next_required_source != -1 && sources[next_required_source].size == 0)
+ throw Exception("Cannot fetch required block. Source " + toString(next_required_source), ErrorCodes::RECEIVED_EMPTY_DATA);
+
+ /// Surprisingly this call may directly change some internal state of ColumnGathererStream.
/// output_column. See ColumnGathererStream::gather.
- output_column->gather(*this);
- if (!output_column->empty())
- output_block.getByPosition(0).column = std::move(output_column);
+ result_column->gather(*this);
- return output_block;
+ if (next_required_source != -1)
+ return Status(next_required_source);
+
+ if (source_to_fully_copy && result_column->empty())
+ {
+ Chunk res;
+ merged_rows += source_to_fully_copy->column->size();
+ merged_bytes += source_to_fully_copy->column->allocatedBytes();
+ res.addColumn(source_to_fully_copy->column);
+ source_to_fully_copy->pos = source_to_fully_copy->size;
+ source_to_fully_copy = nullptr;
+ return Status(std::move(res));
+ }
+
+ auto col = result_column->cloneEmpty();
+ result_column.swap(col);
+
+ Chunk res;
+ merged_rows += col->size();
+ merged_bytes += col->allocatedBytes();
+ res.addColumn(std::move(col));
+ return Status(std::move(res), row_sources_buf.eof());
}
-void ColumnGathererStream::fetchNewBlock(Source & source, size_t source_num)
+void ColumnGathererStream::consume(Input & input, size_t source_num)
{
- try
- {
- source.block = children[source_num]->read();
- source.update(column_name);
- }
- catch (Exception & e)
- {
- e.addMessage("Cannot fetch required block. Stream " + children[source_num]->getName() + ", part " + toString(source_num));
- throw;
- }
+ auto & source = sources[source_num];
+ if (input.chunk)
+ source.update(input.chunk.getColumns().at(0));
if (0 == source.size)
{
- throw Exception("Fetched block is empty. Stream " + children[source_num]->getName() + ", part " + toString(source_num),
+ throw Exception("Fetched block is empty. Source " + toString(source_num),
ErrorCodes::RECEIVED_EMPTY_DATA);
}
}
-
-void ColumnGathererStream::readSuffixImpl()
+ColumnGathererTransform::ColumnGathererTransform(
+ const Block & header,
+ size_t num_inputs,
+ ReadBuffer & row_sources_buf_,
+ size_t block_preferred_size_)
+ : IMergingTransform(
+ num_inputs, header, header, /*have_all_inputs_=*/ true, /*has_limit_below_one_block_=*/ false,
+ num_inputs, row_sources_buf_, block_preferred_size_)
+ , log(&Poco::Logger::get("ColumnGathererStream"))
{
- const BlockStreamProfileInfo & profile_info = getProfileInfo();
+ if (header.columns() != 1)
+ throw Exception(
+ "Header should have 1 column, but contains " + toString(header.columns()),
+ ErrorCodes::INCORRECT_NUMBER_OF_COLUMNS);
+}
+void ColumnGathererTransform::work()
+{
+ Stopwatch stopwatch;
+ IMergingTransform::work();
+ elapsed_ns += stopwatch.elapsedNanoseconds();
+}
+
+void ColumnGathererTransform::onFinish()
+{
+ auto merged_rows = algorithm.getMergedRows();
+ auto merged_bytes = algorithm.getMergedRows();
/// Don't print info for small parts (< 10M rows)
- if (profile_info.rows < 10000000)
+ if (merged_rows < 10000000)
return;
- double seconds = profile_info.total_stopwatch.elapsedSeconds();
+ double seconds = static_cast(elapsed_ns) / 1000000000ULL;
+ const auto & column_name = getOutputPort().getHeader().getByPosition(0).name;
if (!seconds)
LOG_DEBUG(log, "Gathered column {} ({} bytes/elem.) in 0 sec.",
- column_name, static_cast(profile_info.bytes) / profile_info.rows);
+ column_name, static_cast(merged_bytes) / merged_rows);
else
LOG_DEBUG(log, "Gathered column {} ({} bytes/elem.) in {} sec., {} rows/sec., {}/sec.",
- column_name, static_cast(profile_info.bytes) / profile_info.rows, seconds,
- profile_info.rows / seconds, ReadableSize(profile_info.bytes / seconds));
+ column_name, static_cast(merged_bytes) / merged_rows, seconds,
+ merged_rows / seconds, ReadableSize(merged_bytes / seconds));
}
}
diff --git a/src/DataStreams/ColumnGathererStream.h b/src/DataStreams/ColumnGathererStream.h
index 05665ab3f42..43cbf7094d8 100644
--- a/src/DataStreams/ColumnGathererStream.h
+++ b/src/DataStreams/ColumnGathererStream.h
@@ -1,8 +1,9 @@
#pragma once
-#include
#include
#include
+#include
+#include
namespace Poco { class Logger; }
@@ -53,77 +54,91 @@ using MergedRowSources = PODArray;
* Stream mask maps row number to index of source stream.
* Streams should contain exactly one column.
*/
-class ColumnGathererStream : public IBlockInputStream
+class ColumnGathererStream final : public IMergingAlgorithm
{
public:
- ColumnGathererStream(
- const String & column_name_, const BlockInputStreams & source_streams, ReadBuffer & row_sources_buf_,
- size_t block_preferred_size_ = DEFAULT_BLOCK_SIZE);
+ ColumnGathererStream(size_t num_inputs, ReadBuffer & row_sources_buf_, size_t block_preferred_size_ = DEFAULT_BLOCK_SIZE);
- String getName() const override { return "ColumnGatherer"; }
-
- Block readImpl() override;
-
- void readSuffixImpl() override;
-
- Block getHeader() const override { return children.at(0)->getHeader(); }
+ void initialize(Inputs inputs) override;
+ void consume(Input & input, size_t source_num) override;
+ Status merge() override;
/// for use in implementations of IColumn::gather()
template
void gather(Column & column_res);
+ UInt64 getMergedRows() const { return merged_rows; }
+ UInt64 getMergedBytes() const { return merged_bytes; }
+
private:
/// Cache required fields
struct Source
{
- const IColumn * column = nullptr;
+ ColumnPtr column;
size_t pos = 0;
size_t size = 0;
- Block block;
- void update(const String & name)
+ void update(ColumnPtr column_)
{
- column = block.getByName(name).column.get();
- size = block.rows();
+ column = std::move(column_);
+ size = column->size();
pos = 0;
}
};
- void fetchNewBlock(Source & source, size_t source_num);
-
- String column_name;
- ColumnWithTypeAndName column;
+ MutableColumnPtr result_column;
std::vector
-
-
+
From a99a6fccc7289fb75bb55a3b47cfda8d144478b0 Mon Sep 17 00:00:00 2001
From: WangZengrui
Date: Sat, 2 Oct 2021 02:34:53 +0800
Subject: [PATCH 017/104] init
---
src/Interpreters/getOSKernelVersion.cpp | 37 +++++++++++++++++++++++++
src/Interpreters/getOSKernelVersion.h | 31 +++++++++++++++++++++
2 files changed, 68 insertions(+)
create mode 100644 src/Interpreters/getOSKernelVersion.cpp
create mode 100644 src/Interpreters/getOSKernelVersion.h
diff --git a/src/Interpreters/getOSKernelVersion.cpp b/src/Interpreters/getOSKernelVersion.cpp
new file mode 100644
index 00000000000..44df948be3c
--- /dev/null
+++ b/src/Interpreters/getOSKernelVersion.cpp
@@ -0,0 +1,37 @@
+#if defined(OS_LINUX)
+#include
+
+
+namespace DB
+{
+
+namespace ErrorCodes
+{
+ extern const int BAD_ARGUMENTS;
+}
+
+String getOSKernelVersion()
+{
+ struct utsname os_kernel_version;
+ int buf = uname(&os_kernel_version);
+ if (buf < 0)
+ {
+ throw Exception(
+ "EFAULT buf is not valid.",
+ ErrorCodes::BAD_ARGUMENTS);
+ }
+ else
+ {
+ // std::cout <<"sysname: " << os_kernel_version.sysname << " nodename: " << os_kernel_version.nodename
+ // << " release: " << os_kernel_version.release << " version: " << os_kernel_version.version
+ // << " machine: " << os_kernel_version.machine << std::endl;
+
+ return "sysname: " + String(os_kernel_version.sysname) + " nodename: " + String(os_kernel_version.nodename)
+ + " release: " + String(os_kernel_version.release) + " version: " + String(os_kernel_version.version)
+ + " machine: " + String(os_kernel_version.machine);
+ }
+}
+
+}
+
+#endif
\ No newline at end of file
diff --git a/src/Interpreters/getOSKernelVersion.h b/src/Interpreters/getOSKernelVersion.h
new file mode 100644
index 00000000000..14b42d2a19a
--- /dev/null
+++ b/src/Interpreters/getOSKernelVersion.h
@@ -0,0 +1,31 @@
+#if defined(OS_LINUX)
+#pragma once
+
+#include
+
+#include
+#include
+
+namespace DB
+{
+
+/// Returns String with OS Kernel version.
+/* Obtains the name of and information about the currently running kernel.
+   For simplicity, this function is implemented only for Linux.
+*/
+
+String getOSKernelVersion();
+
+// String getSysName();
+
+// String getNodeName();
+
+// String getReleaseName();
+
+// String getVersion();
+
+// String getMachineName();
+
+}
+
+#endif
\ No newline at end of file
From 1c62a53afe8344908a7d8b0c6ea3baf55e3aada9 Mon Sep 17 00:00:00 2001
From: Tatiana Kirillova
Date: Mon, 4 Oct 2021 20:49:21 +0300
Subject: [PATCH 018/104] Document the enable_positional_arguments setting
---
docs/en/operations/settings/settings.md | 36 +++++++++++++++++++
.../sql-reference/statements/select/index.md | 2 +-
2 files changed, 37 insertions(+), 1 deletion(-)
diff --git a/docs/en/operations/settings/settings.md b/docs/en/operations/settings/settings.md
index de7a1835038..320dadb6783 100644
--- a/docs/en/operations/settings/settings.md
+++ b/docs/en/operations/settings/settings.md
@@ -3749,3 +3749,39 @@ Exception: Total regexp lengths too large.
**See Also**
- [max_hyperscan_regexp_length](#max-hyperscan-regexp-length)
+
+## enable_positional_arguments {#enable-positional-arguments}
+
+Enables or disables supporting positional arguments for [GROUP BY](../../sql-reference/statements/select/group-by.md), [LIMIT BY](../../sql-reference/statements/select/limit-by.md), [ORDER BY](../../sql-reference/statements/select/order-by.md) statement. When you want to use column numbers instead of titles in these clauses, set `enable_positional_arguments = 1`.
+
+Possible values:
+
+- 0 — Disabled.
+- 1 — Enabled.
+
+Default value: `0`.
+
+**Example**
+
+Query:
+
+```sql
+CREATE TABLE positional_arguments(one Int, two Int, tree Int) ENGINE=Memory();
+
+INSERT INTO positional_arguments VALUES (10, 20, 30), (20, 30, 10), (30, 10, 20);
+
+SET enable_positional_arguments = 1;
+
+SELECT * FROM positional_arguments ORDER BY 2,3;
+```
+
+Result:
+
+```text
+┌─one─┬─two─┬─tree─┐
+│ 30 │ 10 │ 20 │
+│ 10 │ 20 │ 30 │
+│ 20 │ 30 │ 10 │
+└─────┴─────┴──────┘
+
+```
\ No newline at end of file
diff --git a/docs/en/sql-reference/statements/select/index.md b/docs/en/sql-reference/statements/select/index.md
index b3cc7555d91..2bfaf4af297 100644
--- a/docs/en/sql-reference/statements/select/index.md
+++ b/docs/en/sql-reference/statements/select/index.md
@@ -144,7 +144,7 @@ Extreme values are calculated for rows before `LIMIT`, but after `LIMIT BY`. How
You can use synonyms (`AS` aliases) in any part of a query.
-The `GROUP BY` and `ORDER BY` clauses do not support positional arguments. This contradicts MySQL, but conforms to standard SQL. For example, `GROUP BY 1, 2` will be interpreted as grouping by constants (i.e. aggregation of all rows into one).
+The `GROUP BY`, `ORDER BY` and `LIMIT BY` clauses support positional arguments. For example, ORDER BY 1,2 will be sorting rows on the table on the first and then the second column.
## Implementation Details {#implementation-details}
From 83424685fc6af68d66e3eacf6d7cc5f095ff6947 Mon Sep 17 00:00:00 2001
From: Tatiana Kirillova
Date: Mon, 4 Oct 2021 21:11:12 +0300
Subject: [PATCH 019/104] update example
---
docs/en/operations/settings/settings.md | 6 +++---
docs/en/sql-reference/statements/select/index.md | 2 +-
2 files changed, 4 insertions(+), 4 deletions(-)
diff --git a/docs/en/operations/settings/settings.md b/docs/en/operations/settings/settings.md
index 320dadb6783..46f72bd4f2b 100644
--- a/docs/en/operations/settings/settings.md
+++ b/docs/en/operations/settings/settings.md
@@ -3752,7 +3752,7 @@ Exception: Total regexp lengths too large.
## enable_positional_arguments {#enable-positional-arguments}
-Enables or disables supporting positional arguments for [GROUP BY](../../sql-reference/statements/select/group-by.md), [LIMIT BY](../../sql-reference/statements/select/limit-by.md), [ORDER BY](../../sql-reference/statements/select/order-by.md) statement. When you want to use column numbers instead of titles in these clauses, set `enable_positional_arguments = 1`.
+Enables or disables supporting positional arguments for [GROUP BY](../../sql-reference/statements/select/group-by.md), [LIMIT BY](../../sql-reference/statements/select/limit-by.md), [ORDER BY](../../sql-reference/statements/select/order-by.md) statements. When you want to use column numbers instead of titles in these clauses, set `enable_positional_arguments = 1`.
Possible values:
@@ -3768,7 +3768,7 @@ Query:
```sql
CREATE TABLE positional_arguments(one Int, two Int, tree Int) ENGINE=Memory();
-INSERT INTO positional_arguments VALUES (10, 20, 30), (20, 30, 10), (30, 10, 20);
+INSERT INTO positional_arguments VALUES (10, 20, 30), (20, 20, 10), (30, 10, 20);
SET enable_positional_arguments = 1;
@@ -3780,8 +3780,8 @@ Result:
```text
┌─one─┬─two─┬─tree─┐
│ 30 │ 10 │ 20 │
+│ 20 │ 20 │ 10 │
│ 10 │ 20 │ 30 │
-│ 20 │ 30 │ 10 │
└─────┴─────┴──────┘
```
\ No newline at end of file
diff --git a/docs/en/sql-reference/statements/select/index.md b/docs/en/sql-reference/statements/select/index.md
index 2bfaf4af297..35bbb7de2cf 100644
--- a/docs/en/sql-reference/statements/select/index.md
+++ b/docs/en/sql-reference/statements/select/index.md
@@ -144,7 +144,7 @@ Extreme values are calculated for rows before `LIMIT`, but after `LIMIT BY`. How
You can use synonyms (`AS` aliases) in any part of a query.
-The `GROUP BY`, `ORDER BY` and `LIMIT BY` clauses support positional arguments. For example, ORDER BY 1,2 will be sorting rows on the table on the first and then the second column.
+The `GROUP BY`, `ORDER BY`, and `LIMIT BY` clauses support positional arguments. For example, `ORDER BY 1,2` will be sorting rows on the table on the first and then the second column.
## Implementation Details {#implementation-details}
From c049170f7820a57cd8f7c5d7fc037dc6f88b110d Mon Sep 17 00:00:00 2001
From: Tatiana Kirillova
Date: Mon, 4 Oct 2021 21:26:04 +0300
Subject: [PATCH 020/104] minor fix
---
docs/en/operations/settings/settings.md | 4 ++--
docs/en/sql-reference/statements/select/index.md | 2 +-
2 files changed, 3 insertions(+), 3 deletions(-)
diff --git a/docs/en/operations/settings/settings.md b/docs/en/operations/settings/settings.md
index 46f72bd4f2b..e6e912e74db 100644
--- a/docs/en/operations/settings/settings.md
+++ b/docs/en/operations/settings/settings.md
@@ -3766,7 +3766,7 @@ Default value: `0`.
Query:
```sql
-CREATE TABLE positional_arguments(one Int, two Int, tree Int) ENGINE=Memory();
+CREATE TABLE positional_arguments(one Int, two Int, three Int) ENGINE=Memory();
INSERT INTO positional_arguments VALUES (10, 20, 30), (20, 20, 10), (30, 10, 20);
@@ -3778,7 +3778,7 @@ SELECT * FROM positional_arguments ORDER BY 2,3;
Result:
```text
-┌─one─┬─two─┬─tree─┐
+┌─one─┬─two─┬─three─┐
│ 30 │ 10 │ 20 │
│ 20 │ 20 │ 10 │
│ 10 │ 20 │ 30 │
diff --git a/docs/en/sql-reference/statements/select/index.md b/docs/en/sql-reference/statements/select/index.md
index 35bbb7de2cf..e31ba6b1f4b 100644
--- a/docs/en/sql-reference/statements/select/index.md
+++ b/docs/en/sql-reference/statements/select/index.md
@@ -144,7 +144,7 @@ Extreme values are calculated for rows before `LIMIT`, but after `LIMIT BY`. How
You can use synonyms (`AS` aliases) in any part of a query.
-The `GROUP BY`, `ORDER BY`, and `LIMIT BY` clauses support positional arguments. For example, `ORDER BY 1,2` will be sorting rows on the table on the first and then the second column.
+The `GROUP BY`, `ORDER BY`, and `LIMIT BY` clauses support positional arguments. For example, `ORDER BY 1,2` will be sorting rows in the table on the first and then the second column.
## Implementation Details {#implementation-details}
From 1afe2dfb40840e34dfd2087e7b23e07191b117e4 Mon Sep 17 00:00:00 2001
From: Tatiana Kirillova
Date: Mon, 4 Oct 2021 21:35:54 +0300
Subject: [PATCH 021/104] fix example
---
docs/en/operations/settings/settings.md | 8 ++++----
1 file changed, 4 insertions(+), 4 deletions(-)
diff --git a/docs/en/operations/settings/settings.md b/docs/en/operations/settings/settings.md
index e6e912e74db..246f97e47fc 100644
--- a/docs/en/operations/settings/settings.md
+++ b/docs/en/operations/settings/settings.md
@@ -3779,9 +3779,9 @@ Result:
```text
┌─one─┬─two─┬─three─┐
-│ 30 │ 10 │ 20 │
-│ 20 │ 20 │ 10 │
-│ 10 │ 20 │ 30 │
-└─────┴─────┴──────┘
+│ 30 │ 10 │ 20 │
+│ 20 │ 20 │ 10 │
+│ 10 │ 20 │ 30 │
+└─────┴─────┴─────-─┘
```
\ No newline at end of file
From 2001ebbf9d493b5803b0370efc9f0fa272fbf98f Mon Sep 17 00:00:00 2001
From: Nikolai Kochetov
Date: Mon, 4 Oct 2021 21:52:31 +0300
Subject: [PATCH 022/104] Fix build.
---
src/DataStreams/ColumnGathererStream.h | 2 +-
src/Storages/MergeTree/DataPartsExchange.cpp | 2 --
src/Storages/MergeTree/MergeTask.cpp | 29 +++++++++++--------
src/Storages/MergeTree/MergeTask.h | 5 ++--
.../MergeTree/MergeTreeDataPartInMemory.cpp | 2 --
.../MergeTree/MergeTreeDataWriter.cpp | 2 --
.../MergeTree/MergeTreeWriteAheadLog.cpp | 1 -
src/Storages/MergeTree/MutateTask.cpp | 3 --
src/Storages/StorageReplicatedMergeTree.cpp | 1 -
9 files changed, 21 insertions(+), 26 deletions(-)
diff --git a/src/DataStreams/ColumnGathererStream.h b/src/DataStreams/ColumnGathererStream.h
index 43cbf7094d8..39ba57bce35 100644
--- a/src/DataStreams/ColumnGathererStream.h
+++ b/src/DataStreams/ColumnGathererStream.h
@@ -137,7 +137,7 @@ void ColumnGathererStream::gather(Column & column_res)
column_res.reserve(cur_block_preferred_size);
}
- size_t cur_size = column_res->size();
+ size_t cur_size = column_res.size();
next_required_source = -1;
while (row_source_pos < row_sources_end && cur_size < cur_block_preferred_size)
diff --git a/src/Storages/MergeTree/DataPartsExchange.cpp b/src/Storages/MergeTree/DataPartsExchange.cpp
index 2683b5a6042..e8ba5d6acd9 100644
--- a/src/Storages/MergeTree/DataPartsExchange.cpp
+++ b/src/Storages/MergeTree/DataPartsExchange.cpp
@@ -589,7 +589,6 @@ MergeTreeData::MutableDataPartPtr Fetcher::downloadPartToMemory(
block.getNamesAndTypesList(),
{},
CompressionCodecFactory::instance().get("NONE", {}));
- part_out.writePrefix();
part_out.write(block);
part_out.writeSuffixAndFinalizePart(new_projection_part);
new_projection_part->checksums.checkEqual(checksums, /* have_uncompressed = */ true);
@@ -612,7 +611,6 @@ MergeTreeData::MutableDataPartPtr Fetcher::downloadPartToMemory(
MergedBlockOutputStream part_out(
new_data_part, metadata_snapshot, block.getNamesAndTypesList(), {}, CompressionCodecFactory::instance().get("NONE", {}));
- part_out.writePrefix();
part_out.write(block);
part_out.writeSuffixAndFinalizePart(new_data_part);
new_data_part->checksums.checkEqual(checksums, /* have_uncompressed = */ true);
diff --git a/src/Storages/MergeTree/MergeTask.cpp b/src/Storages/MergeTree/MergeTask.cpp
index 54230f56a6c..70451413b41 100644
--- a/src/Storages/MergeTree/MergeTask.cpp
+++ b/src/Storages/MergeTree/MergeTask.cpp
@@ -350,8 +350,6 @@ bool MergeTask::VerticalMergeStage::prepareVerticalMergeForAllColumns() const
global_ctx->merge_list_element_ptr->columns_written = global_ctx->merging_column_names.size();
global_ctx->merge_list_element_ptr->progress.store(ctx->column_sizes->keyColumnsWeight(), std::memory_order_relaxed);
- ctx->column_part_streams = BlockInputStreams(global_ctx->future_part->parts.size());
-
ctx->rows_sources_write_buf->next();
ctx->rows_sources_uncompressed_write_buf->next();
/// Ensure data has written to disk.
@@ -386,6 +384,7 @@ void MergeTask::VerticalMergeStage::prepareVerticalMergeForOneColumn() const
global_ctx->column_progress = std::make_unique(ctx->progress_before, ctx->column_sizes->columnWeight(column_name));
+ Pipes pipes;
for (size_t part_num = 0; part_num < global_ctx->future_part->parts.size(); ++part_num)
{
auto column_part_source = std::make_shared(
@@ -395,20 +394,22 @@ void MergeTask::VerticalMergeStage::prepareVerticalMergeForOneColumn() const
column_part_source->setProgressCallback(
MergeProgressCallback(global_ctx->merge_list_element_ptr, global_ctx->watch_prev_elapsed, *global_ctx->column_progress));
- QueryPipeline column_part_pipeline(Pipe(std::move(column_part_source)));
- column_part_pipeline.setNumThreads(1);
-
- ctx->column_part_streams[part_num] =
- std::make_shared(std::move(column_part_pipeline));
+ pipes.emplace_back(std::move(column_part_source));
}
+ auto pipe = Pipe::unitePipes(std::move(pipes));
+
ctx->rows_sources_read_buf->seek(0, 0);
- ctx->column_gathered_stream = std::make_unique(column_name, ctx->column_part_streams, *ctx->rows_sources_read_buf);
+ auto transform = std::make_unique(pipe.getHeader(), pipe.numOutputPorts(), *ctx->rows_sources_read_buf);
+ pipe.addTransform(std::move(transform));
+
+ ctx->column_parts_pipeline = QueryPipeline(std::move(pipe));
+ ctx->executor = std::make_unique(ctx->column_parts_pipeline);
ctx->column_to = std::make_unique(
global_ctx->new_data_part,
global_ctx->metadata_snapshot,
- ctx->column_gathered_stream->getHeader(),
+ ctx->executor->getHeader(),
ctx->compression_codec,
/// we don't need to recalc indices here
/// because all of them were already recalculated and written
@@ -424,7 +425,7 @@ void MergeTask::VerticalMergeStage::prepareVerticalMergeForOneColumn() const
bool MergeTask::VerticalMergeStage::executeVerticalMergeForOneColumn() const
{
Block block;
- if (!global_ctx->merges_blocker->isCancelled() && (block = ctx->column_gathered_stream->read()))
+ if (!global_ctx->merges_blocker->isCancelled() && ctx->executor->pull(block))
{
ctx->column_elems_written += block.rows();
ctx->column_to->write(block);
@@ -442,7 +443,7 @@ void MergeTask::VerticalMergeStage::finalizeVerticalMergeForOneColumn() const
if (global_ctx->merges_blocker->isCancelled())
throw Exception("Cancelled merging parts", ErrorCodes::ABORTED);
- ctx->column_gathered_stream->readSuffix();
+ ctx->executor.reset();
auto changed_checksums = ctx->column_to->writeSuffixAndGetChecksums(global_ctx->new_data_part, global_ctx->checksums_gathered_columns, ctx->need_sync);
global_ctx->checksums_gathered_columns.add(std::move(changed_checksums));
@@ -452,10 +453,14 @@ void MergeTask::VerticalMergeStage::finalizeVerticalMergeForOneColumn() const
", but " + toString(global_ctx->rows_written) + " rows of PK columns", ErrorCodes::LOGICAL_ERROR);
}
+ UInt64 rows = 0;
+ UInt64 bytes = 0;
+ ctx->column_parts_pipeline.tryGetResultRowsAndBytes(rows, bytes);
+
/// NOTE: 'progress' is modified by single thread, but it may be concurrently read from MergeListElement::getInfo() (StorageSystemMerges).
global_ctx->merge_list_element_ptr->columns_written += 1;
- global_ctx->merge_list_element_ptr->bytes_written_uncompressed += ctx->column_gathered_stream->getProfileInfo().bytes;
+ global_ctx->merge_list_element_ptr->bytes_written_uncompressed += bytes;
global_ctx->merge_list_element_ptr->progress.store(ctx->progress_before + ctx->column_sizes->columnWeight(column_name), std::memory_order_relaxed);
/// This is the external cycle increment.
diff --git a/src/Storages/MergeTree/MergeTask.h b/src/Storages/MergeTree/MergeTask.h
index 54b0255fd5c..ce628d831ae 100644
--- a/src/Storages/MergeTree/MergeTask.h
+++ b/src/Storages/MergeTree/MergeTask.h
@@ -9,6 +9,7 @@
#include
#include
#include
+#include
#include
#include
@@ -263,8 +264,8 @@ private:
Float64 progress_before = 0;
std::unique_ptr column_to{nullptr};
size_t column_elems_written{0};
- BlockInputStreams column_part_streams;
- std::unique_ptr column_gathered_stream;
+ QueryPipeline column_parts_pipeline;
+ std::unique_ptr executor;
std::unique_ptr rows_sources_read_buf{nullptr};
};
diff --git a/src/Storages/MergeTree/MergeTreeDataPartInMemory.cpp b/src/Storages/MergeTree/MergeTreeDataPartInMemory.cpp
index 635da7e2ede..d43855fa8de 100644
--- a/src/Storages/MergeTree/MergeTreeDataPartInMemory.cpp
+++ b/src/Storages/MergeTree/MergeTreeDataPartInMemory.cpp
@@ -92,7 +92,6 @@ void MergeTreeDataPartInMemory::flushToDisk(const String & base_path, const Stri
auto compression_codec = storage.getContext()->chooseCompressionCodec(0, 0);
auto indices = MergeTreeIndexFactory::instance().getMany(metadata_snapshot->getSecondaryIndices());
MergedBlockOutputStream out(new_data_part, metadata_snapshot, columns, indices, compression_codec);
- out.writePrefix();
out.write(block);
const auto & projections = metadata_snapshot->getProjections();
for (const auto & [projection_name, projection] : projection_parts)
@@ -123,7 +122,6 @@ void MergeTreeDataPartInMemory::flushToDisk(const String & base_path, const Stri
auto projection_indices = MergeTreeIndexFactory::instance().getMany(desc.metadata->getSecondaryIndices());
MergedBlockOutputStream projection_out(
projection_data_part, desc.metadata, projection_part->columns, projection_indices, projection_compression_codec);
- projection_out.writePrefix();
projection_out.write(projection_part->block);
projection_out.writeSuffixAndFinalizePart(projection_data_part);
new_data_part->addProjectionPart(projection_name, std::move(projection_data_part));
diff --git a/src/Storages/MergeTree/MergeTreeDataWriter.cpp b/src/Storages/MergeTree/MergeTreeDataWriter.cpp
index 95ddf105b79..d939312c0bb 100644
--- a/src/Storages/MergeTree/MergeTreeDataWriter.cpp
+++ b/src/Storages/MergeTree/MergeTreeDataWriter.cpp
@@ -412,7 +412,6 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataWriter::writeTempPart(
MergedBlockOutputStream out(new_data_part, metadata_snapshot, columns, index_factory.getMany(metadata_snapshot->getSecondaryIndices()), compression_codec);
bool sync_on_insert = data.getSettings()->fsync_after_insert;
- out.writePrefix();
out.writeWithPermutation(block, perm_ptr);
for (const auto & projection : metadata_snapshot->getProjections())
@@ -508,7 +507,6 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataWriter::writeProjectionPartImpl(
{},
compression_codec);
- out.writePrefix();
out.writeWithPermutation(block, perm_ptr);
out.writeSuffixAndFinalizePart(new_data_part);
diff --git a/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp b/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp
index 3e8aa6af536..2c1d785236c 100644
--- a/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp
+++ b/src/Storages/MergeTree/MergeTreeWriteAheadLog.cpp
@@ -202,7 +202,6 @@ MergeTreeData::MutableDataPartsVector MergeTreeWriteAheadLog::restore(const Stor
if (metadata_snapshot->hasSortingKey())
metadata_snapshot->getSortingKey().expression->execute(block);
- part_out.writePrefix();
part_out.write(block);
for (const auto & projection : metadata_snapshot->getProjections())
diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp
index 0655806bf0e..b93075d0ce6 100644
--- a/src/Storages/MergeTree/MutateTask.cpp
+++ b/src/Storages/MergeTree/MutateTask.cpp
@@ -793,7 +793,6 @@ bool PartMergerWriter::mutateOriginalPartAndPrepareProjections()
if (ctx->minmax_idx)
ctx->minmax_idx->update(block, ctx->data->getMinMaxColumnsNames(ctx->metadata_snapshot->getPartitionKey()));
- ctx->out->write(block);
for (size_t i = 0, size = ctx->projections_to_build.size(); i < size; ++i)
{
@@ -952,7 +951,6 @@ private:
ctx->compression_codec);
ctx->mutating_stream->readPrefix();
- ctx->out->writePrefix();
part_merger_writer_task = std::make_unique(ctx);
}
@@ -1102,7 +1100,6 @@ private:
);
ctx->mutating_stream->readPrefix();
- ctx->out->writePrefix();
ctx->projections_to_build = std::vector{ctx->projections_to_recalc.begin(), ctx->projections_to_recalc.end()};
part_merger_writer_task = std::make_unique(ctx);
diff --git a/src/Storages/StorageReplicatedMergeTree.cpp b/src/Storages/StorageReplicatedMergeTree.cpp
index 3b84c4c4a03..eafe81f8c88 100644
--- a/src/Storages/StorageReplicatedMergeTree.cpp
+++ b/src/Storages/StorageReplicatedMergeTree.cpp
@@ -7157,7 +7157,6 @@ bool StorageReplicatedMergeTree::createEmptyPartInsteadOfLost(zkutil::ZooKeeperP
MergedBlockOutputStream out(new_data_part, metadata_snapshot, columns, index_factory.getMany(metadata_snapshot->getSecondaryIndices()), compression_codec);
bool sync_on_insert = settings->fsync_after_insert;
- out.writePrefix();
out.write(block);
/// TODO(ab): What projections should we add to the empty part? How can we make sure that it
/// won't block future merges? Perhaps we should also check part emptiness when selecting parts
From 6febfeea77ad6e28e23a2ccb0cde99e7bbca35b5 Mon Sep 17 00:00:00 2001
From: Tatiana Kirillova
Date: Mon, 4 Oct 2021 21:55:03 +0300
Subject: [PATCH 023/104] fix table
---
docs/en/operations/settings/settings.md | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/docs/en/operations/settings/settings.md b/docs/en/operations/settings/settings.md
index 246f97e47fc..22bde8cffa8 100644
--- a/docs/en/operations/settings/settings.md
+++ b/docs/en/operations/settings/settings.md
@@ -3782,6 +3782,6 @@ Result:
│ 30 │ 10 │ 20 │
│ 20 │ 20 │ 10 │
│ 10 │ 20 │ 30 │
-└─────┴─────┴─────-─┘
+└─────┴─────┴───────┘
```
\ No newline at end of file
From a638c40fdcfd1b8b01153713e070664c1c38976f Mon Sep 17 00:00:00 2001
From: WangZengrui
Date: Tue, 5 Oct 2021 09:08:16 +0800
Subject: [PATCH 024/104] add getOSKernelVersion
---
src/Interpreters/getOSKernelVersion.cpp | 18 ++++++------------
src/Interpreters/getOSKernelVersion.h | 12 +-----------
2 files changed, 7 insertions(+), 23 deletions(-)
diff --git a/src/Interpreters/getOSKernelVersion.cpp b/src/Interpreters/getOSKernelVersion.cpp
index 44df948be3c..c4b4564f46e 100644
--- a/src/Interpreters/getOSKernelVersion.cpp
+++ b/src/Interpreters/getOSKernelVersion.cpp
@@ -7,28 +7,22 @@ namespace DB
namespace ErrorCodes
{
- extern const int BAD_ARGUMENTS;
+ extern const int SYSTEM_ERROR;
}
String getOSKernelVersion()
{
- struct utsname os_kernel_version;
- int buf = uname(&os_kernel_version);
+ struct utsname os_kernel_info;
+ int buf = uname(&os_kernel_info);
if (buf < 0)
{
throw Exception(
- "EFAULT buf is not valid.",
- ErrorCodes::BAD_ARGUMENTS);
+ "EFAULT buffer is not valid.",
+ ErrorCodes::SYSTEM_ERROR);
}
else
{
- // std::cout <<"sysname: " << os_kernel_version.sysname << " nodename: " << os_kernel_version.nodename
- // << " release: " << os_kernel_version.release << " version: " << os_kernel_version.version
- // << " machine: " << os_kernel_version.machine << std::endl;
-
- return "sysname: " + String(os_kernel_version.sysname) + " nodename: " + String(os_kernel_version.nodename)
- + " release: " + String(os_kernel_version.release) + " version: " + String(os_kernel_version.version)
- + " machine: " + String(os_kernel_version.machine);
+ return String(os_kernel_info.sysname) + " " + String(os_kernel_info.release);
}
}
diff --git a/src/Interpreters/getOSKernelVersion.h b/src/Interpreters/getOSKernelVersion.h
index 14b42d2a19a..fc3c7583aef 100644
--- a/src/Interpreters/getOSKernelVersion.h
+++ b/src/Interpreters/getOSKernelVersion.h
@@ -1,5 +1,5 @@
-#if defined(OS_LINUX)
#pragma once
+#if defined(OS_LINUX)
#include
@@ -16,16 +16,6 @@ namespace DB
String getOSKernelVersion();
-// String getSysName();
-
-// String getNodeName();
-
-// String getReleaseName();
-
-// String getVersion();
-
-// String getMachineName();
-
}
#endif
\ No newline at end of file
From c106f1e38000dd7b8847ad99c6dac231af3e20b8 Mon Sep 17 00:00:00 2001
From: Nikolai Kochetov
Date: Tue, 5 Oct 2021 12:51:43 +0300
Subject: [PATCH 025/104] Fix tests.
---
src/DataStreams/ColumnGathererStream.cpp | 2 +-
src/Processors/Chunk.cpp | 4 +++-
2 files changed, 4 insertions(+), 2 deletions(-)
diff --git a/src/DataStreams/ColumnGathererStream.cpp b/src/DataStreams/ColumnGathererStream.cpp
index 90da7792c21..add473190c0 100644
--- a/src/DataStreams/ColumnGathererStream.cpp
+++ b/src/DataStreams/ColumnGathererStream.cpp
@@ -105,7 +105,7 @@ IMergingAlgorithm::Status ColumnGathererStream::merge()
merged_rows += col->size();
merged_bytes += col->allocatedBytes();
res.addColumn(std::move(col));
- return Status(std::move(res), row_sources_buf.eof());
+ return Status(std::move(res), row_sources_buf.eof() && !source_to_fully_copy);
}
diff --git a/src/Processors/Chunk.cpp b/src/Processors/Chunk.cpp
index 4800bfca2ce..d904f3755bc 100644
--- a/src/Processors/Chunk.cpp
+++ b/src/Processors/Chunk.cpp
@@ -104,7 +104,9 @@ Columns Chunk::detachColumns()
void Chunk::addColumn(ColumnPtr column)
{
- if (column->size() != num_rows)
+ if (empty())
+ num_rows = column->size();
+ else if (column->size() != num_rows)
throw Exception("Invalid number of rows in Chunk column " + column->getName()+ ": expected " +
toString(num_rows) + ", got " + toString(column->size()), ErrorCodes::LOGICAL_ERROR);
From 82e6ac8fa2cdba5ef016bbe4278d7c17888dafb7 Mon Sep 17 00:00:00 2001
From: Filatenkov Artur <58165623+FArthur-cmd@users.noreply.github.com>
Date: Tue, 5 Oct 2021 13:39:18 +0300
Subject: [PATCH 026/104] Update HTTPHandler.cpp
---
src/Server/HTTPHandler.cpp | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/src/Server/HTTPHandler.cpp b/src/Server/HTTPHandler.cpp
index 413cfe18696..1036d5031f7 100644
--- a/src/Server/HTTPHandler.cpp
+++ b/src/Server/HTTPHandler.cpp
@@ -24,7 +24,7 @@
#include
#include
#include
-#include "common/logger_useful.h"
+#include
#include
#include
#include
From 96d070a5baf2847ea35a9587944f73772295afa2 Mon Sep 17 00:00:00 2001
From: Nikolai Kochetov
Date: Tue, 5 Oct 2021 16:58:24 +0300
Subject: [PATCH 027/104] Fix tests.
---
src/Storages/MergeTree/IMergedBlockOutputStream.h | 4 ++++
src/Storages/MergeTree/MergedBlockOutputStream.h | 2 +-
src/Storages/MergeTree/MergedColumnOnlyOutputStream.h | 2 +-
src/Storages/MergeTree/MutateTask.cpp | 1 +
4 files changed, 7 insertions(+), 2 deletions(-)
diff --git a/src/Storages/MergeTree/IMergedBlockOutputStream.h b/src/Storages/MergeTree/IMergedBlockOutputStream.h
index 133f0804838..36fbe76cca2 100644
--- a/src/Storages/MergeTree/IMergedBlockOutputStream.h
+++ b/src/Storages/MergeTree/IMergedBlockOutputStream.h
@@ -15,8 +15,12 @@ public:
const MergeTreeDataPartPtr & data_part,
const StorageMetadataPtr & metadata_snapshot_);
+ virtual ~IMergedBlockOutputStream() = default;
+
using WrittenOffsetColumns = std::set;
+ virtual void write(const Block & block) = 0;
+
const MergeTreeIndexGranularity & getIndexGranularity() const
{
return writer->getIndexGranularity();
diff --git a/src/Storages/MergeTree/MergedBlockOutputStream.h b/src/Storages/MergeTree/MergedBlockOutputStream.h
index 3586ac17298..5965331ee81 100644
--- a/src/Storages/MergeTree/MergedBlockOutputStream.h
+++ b/src/Storages/MergeTree/MergedBlockOutputStream.h
@@ -24,7 +24,7 @@ public:
Block getHeader() const { return metadata_snapshot->getSampleBlock(); }
/// If the data is pre-sorted.
- void write(const Block & block);
+ void write(const Block & block) override;
/** If the data is not sorted, but we have previously calculated the permutation, that will sort it.
* This method is used to save RAM, since you do not need to keep two blocks at once - the original one and the sorted one.
diff --git a/src/Storages/MergeTree/MergedColumnOnlyOutputStream.h b/src/Storages/MergeTree/MergedColumnOnlyOutputStream.h
index 7a146a91331..4b75bc52f72 100644
--- a/src/Storages/MergeTree/MergedColumnOnlyOutputStream.h
+++ b/src/Storages/MergeTree/MergedColumnOnlyOutputStream.h
@@ -24,7 +24,7 @@ public:
const MergeTreeIndexGranularityInfo * index_granularity_info_ = nullptr);
Block getHeader() const { return header; }
- void write(const Block & block);
+ void write(const Block & block) override;
MergeTreeData::DataPart::Checksums
writeSuffixAndGetChecksums(MergeTreeData::MutableDataPartPtr & new_part, MergeTreeData::DataPart::Checksums & all_checksums, bool sync = false);
diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp
index b93075d0ce6..1900b694a8d 100644
--- a/src/Storages/MergeTree/MutateTask.cpp
+++ b/src/Storages/MergeTree/MutateTask.cpp
@@ -793,6 +793,7 @@ bool PartMergerWriter::mutateOriginalPartAndPrepareProjections()
if (ctx->minmax_idx)
ctx->minmax_idx->update(block, ctx->data->getMinMaxColumnsNames(ctx->metadata_snapshot->getPartitionKey()));
+ ctx->out->write(block);
for (size_t i = 0, size = ctx->projections_to_build.size(); i < size; ++i)
{
From 9b1a39fdb9c4b79d2f045f88d97a1ce33c7d4797 Mon Sep 17 00:00:00 2001
From: Artur Filatenkov <613623@mail.ru>
Date: Tue, 5 Oct 2021 17:43:33 +0300
Subject: [PATCH 028/104] refactor after move common to base
---
src/Server/HTTPHandler.cpp | 6 +++---
1 file changed, 3 insertions(+), 3 deletions(-)
diff --git a/src/Server/HTTPHandler.cpp b/src/Server/HTTPHandler.cpp
index 1036d5031f7..9edef8a7223 100644
--- a/src/Server/HTTPHandler.cpp
+++ b/src/Server/HTTPHandler.cpp
@@ -24,15 +24,15 @@
#include
#include
#include
-#include
+#include
#include
#include
#include
#include
#include
-#include
-#include
+#include
+#include
#include
#if !defined(ARCADIA_BUILD)
From aeb670dbe00a9328ed361b84e277f3138fa2ab64 Mon Sep 17 00:00:00 2001
From: Azat Khuzhin
Date: Tue, 5 Oct 2021 21:02:00 +0300
Subject: [PATCH 029/104] Simplify obtaining of server pid in fuzzer tests
---
docker/test/fuzzer/run-fuzzer.sh | 22 +++-------------------
1 file changed, 3 insertions(+), 19 deletions(-)
diff --git a/docker/test/fuzzer/run-fuzzer.sh b/docker/test/fuzzer/run-fuzzer.sh
index 3c3fcd42fde..15590902b68 100755
--- a/docker/test/fuzzer/run-fuzzer.sh
+++ b/docker/test/fuzzer/run-fuzzer.sh
@@ -125,25 +125,9 @@ function fuzz
# interferes with gdb
export CLICKHOUSE_WATCHDOG_ENABLE=0
- # NOTE: that $! cannot be used to obtain the server pid, since it will be
- # the pid of the bash, due to piping the output of clickhouse-server to
- # tail
- PID_FILE=clickhouse-server.pid
- clickhouse-server --pidfile=$PID_FILE --config-file db/config.xml -- --path db 2>&1 | tail -100000 > server.log &
-
- server_pid=-1
- for _ in {1..60}; do
- if [ -s $PID_FILE ]; then
- server_pid=$(cat $PID_FILE)
- break
- fi
- sleep 1
- done
-
- if [ $server_pid = -1 ]; then
- echo "Server did not started" >&2
- exit 1
- fi
+ # NOTE: we use process substitution here to preserve keep $! as a pid of clickhouse-server
+ clickhouse-server --config-file db/config.xml -- --path db > >(tail -100000 > server.log) 2>&1 &
+ server_pid=$!
kill -0 $server_pid
From bd4b0af2e14dfa22257d4778bf135f65dee1723c Mon Sep 17 00:00:00 2001
From: Alexey Milovidov
Date: Wed, 6 Oct 2021 02:34:48 +0300
Subject: [PATCH 030/104] Fix bad cast in ParserCreateQuery
---
src/Parsers/ParserCreateQuery.cpp | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/src/Parsers/ParserCreateQuery.cpp b/src/Parsers/ParserCreateQuery.cpp
index d4525883e36..2ea1663fc80 100644
--- a/src/Parsers/ParserCreateQuery.cpp
+++ b/src/Parsers/ParserCreateQuery.cpp
@@ -481,7 +481,7 @@ bool ParserCreateTableQuery::parseImpl(Pos & pos, ASTPtr & node, Expected & expe
if (attach && s_from.ignore(pos, expected))
{
- ParserLiteral from_path_p;
+ ParserStringLiteral from_path_p;
if (!from_path_p.parse(pos, from_path, expected))
return false;
}
From a518f5ea11667e56e48b065354dd3f81dae945e5 Mon Sep 17 00:00:00 2001
From: Tatiana Kirillova
Date: Wed, 6 Oct 2021 12:26:22 +0300
Subject: [PATCH 031/104] Update docs/en/operations/settings/settings.md
Co-authored-by: olgarev <56617294+olgarev@users.noreply.github.com>
---
docs/en/operations/settings/settings.md | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/docs/en/operations/settings/settings.md b/docs/en/operations/settings/settings.md
index 22bde8cffa8..fa4b96b8fbc 100644
--- a/docs/en/operations/settings/settings.md
+++ b/docs/en/operations/settings/settings.md
@@ -3752,7 +3752,7 @@ Exception: Total regexp lengths too large.
## enable_positional_arguments {#enable-positional-arguments}
-Enables or disables supporting positional arguments for [GROUP BY](../../sql-reference/statements/select/group-by.md), [LIMIT BY](../../sql-reference/statements/select/limit-by.md), [ORDER BY](../../sql-reference/statements/select/order-by.md) statements. When you want to use column numbers instead of titles in these clauses, set `enable_positional_arguments = 1`.
+Enables or disables supporting positional arguments for [GROUP BY](../../sql-reference/statements/select/group-by.md), [LIMIT BY](../../sql-reference/statements/select/limit-by.md), [ORDER BY](../../sql-reference/statements/select/order-by.md) statements. When you want to use column numbers instead of column names in these clauses, set `enable_positional_arguments = 1`.
Possible values:
From 6b619512aa1c1feef9b8bde48fa91b279e2266e6 Mon Sep 17 00:00:00 2001
From: Nikolai Kochetov
Date: Wed, 6 Oct 2021 12:37:56 +0300
Subject: [PATCH 032/104] Fix style.
---
src/DataStreams/ColumnGathererStream.cpp | 1 -
src/DataStreams/ColumnGathererStream.h | 2 +-
src/Storages/MergeTree/MergedBlockOutputStream.cpp | 1 -
3 files changed, 1 insertion(+), 3 deletions(-)
diff --git a/src/DataStreams/ColumnGathererStream.cpp b/src/DataStreams/ColumnGathererStream.cpp
index 319580cf8f3..9b2fac79bb0 100644
--- a/src/DataStreams/ColumnGathererStream.cpp
+++ b/src/DataStreams/ColumnGathererStream.cpp
@@ -11,7 +11,6 @@ namespace DB
namespace ErrorCodes
{
- extern const int INCOMPATIBLE_COLUMNS;
extern const int INCORRECT_NUMBER_OF_COLUMNS;
extern const int EMPTY_DATA_PASSED;
extern const int RECEIVED_EMPTY_DATA;
diff --git a/src/DataStreams/ColumnGathererStream.h b/src/DataStreams/ColumnGathererStream.h
index 39ba57bce35..2d013e596ce 100644
--- a/src/DataStreams/ColumnGathererStream.h
+++ b/src/DataStreams/ColumnGathererStream.h
@@ -96,7 +96,7 @@ private:
Source * source_to_fully_copy = nullptr;
ssize_t next_required_source = -1;
- size_t cur_block_preferred_size;
+ size_t cur_block_preferred_size = 0;
UInt64 merged_rows = 0;
UInt64 merged_bytes = 0;
diff --git a/src/Storages/MergeTree/MergedBlockOutputStream.cpp b/src/Storages/MergeTree/MergedBlockOutputStream.cpp
index 495ce5ee933..5206f77290b 100644
--- a/src/Storages/MergeTree/MergedBlockOutputStream.cpp
+++ b/src/Storages/MergeTree/MergedBlockOutputStream.cpp
@@ -8,7 +8,6 @@ namespace DB
namespace ErrorCodes
{
- extern const int NOT_IMPLEMENTED;
extern const int LOGICAL_ERROR;
}
From c0ee6d46f7dafda4784c4c2db4837015ea934005 Mon Sep 17 00:00:00 2001
From: Alexander Tokmakov
Date: Wed, 6 Oct 2021 15:39:14 +0300
Subject: [PATCH 033/104] resolve dependency of StorageDictionary
---
src/Databases/DDLDependencyVisitor.cpp | 12 ++++++++++++
src/Databases/DDLDependencyVisitor.h | 2 ++
.../integration/helpers/0_common_instance_config.xml | 2 +-
.../integration/test_dictionaries_dependency/test.py | 2 ++
4 files changed, 17 insertions(+), 1 deletion(-)
diff --git a/src/Databases/DDLDependencyVisitor.cpp b/src/Databases/DDLDependencyVisitor.cpp
index 73800e84256..98f697ef641 100644
--- a/src/Databases/DDLDependencyVisitor.cpp
+++ b/src/Databases/DDLDependencyVisitor.cpp
@@ -16,6 +16,8 @@ void DDLDependencyVisitor::visit(const ASTPtr & ast, Data & data)
visit(*function, data);
else if (const auto * dict_source = ast->as())
visit(*dict_source, data);
+ else if (const auto * storage = ast->as())
+ visit(*storage, data);
}
bool DDLDependencyVisitor::needChildVisit(const ASTPtr & node, const ASTPtr & child)
@@ -66,6 +68,16 @@ void DDLDependencyVisitor::visit(const ASTFunctionWithKeyValueArguments & dict_s
data.dependencies.emplace(std::move(info->table_name));
}
+void DDLDependencyVisitor::visit(const ASTStorage & storage, Data & data)
+{
+ if (!storage.engine)
+ return;
+ if (storage.engine->name != "Dictionary")
+ return;
+
+ extractTableNameFromArgument(*storage.engine, data, 0);
+}
+
void DDLDependencyVisitor::extractTableNameFromArgument(const ASTFunction & function, Data & data, size_t arg_idx)
{
diff --git a/src/Databases/DDLDependencyVisitor.h b/src/Databases/DDLDependencyVisitor.h
index c0b39d70b08..5779aee7d33 100644
--- a/src/Databases/DDLDependencyVisitor.h
+++ b/src/Databases/DDLDependencyVisitor.h
@@ -8,6 +8,7 @@ namespace DB
class ASTFunction;
class ASTFunctionWithKeyValueArguments;
+class ASTStorage;
/// Visits ASTCreateQuery and extracts names of table (or dictionary) dependencies
/// from column default expressions (joinGet, dictGet, etc)
@@ -33,6 +34,7 @@ public:
private:
static void visit(const ASTFunction & function, Data & data);
static void visit(const ASTFunctionWithKeyValueArguments & dict_source, Data & data);
+ static void visit(const ASTStorage & storage, Data & data);
static void extractTableNameFromArgument(const ASTFunction & function, Data & data, size_t arg_idx);
};
diff --git a/tests/integration/helpers/0_common_instance_config.xml b/tests/integration/helpers/0_common_instance_config.xml
index 717f6db7e4b..c848ebdf45c 100644
--- a/tests/integration/helpers/0_common_instance_config.xml
+++ b/tests/integration/helpers/0_common_instance_config.xml
@@ -9,7 +9,7 @@
users.xml
- trace
+ test
/var/log/clickhouse-server/clickhouse-server.log
/var/log/clickhouse-server/clickhouse-server.err.log
1000M
diff --git a/tests/integration/test_dictionaries_dependency/test.py b/tests/integration/test_dictionaries_dependency/test.py
index d615f90dc79..ceab39aacb8 100644
--- a/tests/integration/test_dictionaries_dependency/test.py
+++ b/tests/integration/test_dictionaries_dependency/test.py
@@ -36,6 +36,8 @@ def cleanup_after_test():
yield
finally:
for node in nodes:
+ for i in range(4):
+ node.query("DROP DICTIONARY IF EXISTS test.other_{}".format(i))
node.query("DROP DICTIONARY IF EXISTS test.adict")
node.query("DROP DICTIONARY IF EXISTS test.zdict")
node.query("DROP DICTIONARY IF EXISTS atest.dict")
From d0c6f11fcb203b50e32fbab6b9488c6ffa87fcde Mon Sep 17 00:00:00 2001
From: Nikolai Kochetov
Date: Wed, 6 Oct 2021 20:59:27 +0300
Subject: [PATCH 034/104] More.
---
.../DistinctSortedBlockInputStream.cpp | 78 +++++++++---------
.../DistinctSortedBlockInputStream.h | 22 +++--
src/DataStreams/TTLBlockInputStream.cpp | 40 ++++++---
src/DataStreams/TTLBlockInputStream.h | 16 ++--
src/DataStreams/TTLCalcInputStream.cpp | 34 +++++---
src/DataStreams/TTLCalcInputStream.h | 15 ++--
src/Interpreters/MutationsInterpreter.cpp | 7 +-
src/Interpreters/MutationsInterpreter.h | 2 +-
src/Storages/MergeTree/MergeTask.cpp | 37 +++++----
src/Storages/MergeTree/MergeTask.h | 3 +-
src/Storages/MergeTree/MutateTask.cpp | 82 ++++++++++++-------
src/Storages/StorageJoin.cpp | 10 +--
src/Storages/StorageMemory.cpp | 9 +-
13 files changed, 197 insertions(+), 158 deletions(-)
diff --git a/src/DataStreams/DistinctSortedBlockInputStream.cpp b/src/DataStreams/DistinctSortedBlockInputStream.cpp
index eab706924c1..a3105d6330c 100644
--- a/src/DataStreams/DistinctSortedBlockInputStream.cpp
+++ b/src/DataStreams/DistinctSortedBlockInputStream.cpp
@@ -8,40 +8,28 @@ namespace ErrorCodes
extern const int SET_SIZE_LIMIT_EXCEEDED;
}
-DistinctSortedBlockInputStream::DistinctSortedBlockInputStream(
- const BlockInputStreamPtr & input, SortDescription sort_description, const SizeLimits & set_size_limits_, UInt64 limit_hint_, const Names & columns)
- : description(std::move(sort_description))
+DistinctSortedTransform::DistinctSortedTransform(
+ const Block & header, SortDescription sort_description, const SizeLimits & set_size_limits_, UInt64 limit_hint_, const Names & columns)
+ : ISimpleTransform(header, header, true)
+ , description(std::move(sort_description))
, columns_names(columns)
, limit_hint(limit_hint_)
, set_size_limits(set_size_limits_)
{
- children.push_back(input);
}
-Block DistinctSortedBlockInputStream::readImpl()
+void DistinctSortedTransform::transform(Chunk & chunk)
{
- /// Execute until end of stream or until
- /// a block with some new records will be gotten.
- for (;;)
- {
- /// Stop reading if we already reached the limit.
- if (limit_hint && data.getTotalRowCount() >= limit_hint)
- return Block();
-
- Block block = children.back()->read();
- if (!block)
- return Block();
-
- const ColumnRawPtrs column_ptrs(getKeyColumns(block));
+ const ColumnRawPtrs column_ptrs(getKeyColumns(chunk));
if (column_ptrs.empty())
- return block;
+ return;
- const ColumnRawPtrs clearing_hint_columns(getClearingColumns(block, column_ptrs));
+ const ColumnRawPtrs clearing_hint_columns(getClearingColumns(chunk, column_ptrs));
if (data.type == ClearableSetVariants::Type::EMPTY)
data.init(ClearableSetVariants::chooseMethod(column_ptrs, key_sizes));
- const size_t rows = block.rows();
+ const size_t rows = chunk.getNumRows();
IColumn::Filter filter(rows);
bool has_new_data = false;
@@ -59,25 +47,33 @@ Block DistinctSortedBlockInputStream::readImpl()
/// Just go to the next block if there isn't any new record in the current one.
if (!has_new_data)
- continue;
+ return;
if (!set_size_limits.check(data.getTotalRowCount(), data.getTotalByteCount(), "DISTINCT", ErrorCodes::SET_SIZE_LIMIT_EXCEEDED))
- return {};
+ {
+ stopReading();
+ chunk.clear();
+ return;
+ }
- prev_block.block = block;
- prev_block.clearing_hint_columns = std::move(clearing_hint_columns);
+ /// Stop reading if we already reached the limit.
+ if (limit_hint && data.getTotalRowCount() >= limit_hint)
+ stopReading();
- size_t all_columns = block.columns();
+ prev_chunk.chunk = std::move(chunk);
+ prev_chunk.clearing_hint_columns = std::move(clearing_hint_columns);
+
+ size_t all_columns = prev_chunk.chunk.getNumColumns();
+ Chunk res_chunk;
for (size_t i = 0; i < all_columns; ++i)
- block.safeGetByPosition(i).column = block.safeGetByPosition(i).column->filter(filter, -1);
+ res_chunk.addColumn(prev_chunk.chunk.getColumns().at(i)->filter(filter, -1));
- return block;
- }
+ chunk = std::move(res_chunk);
}
template
-bool DistinctSortedBlockInputStream::buildFilter(
+bool DistinctSortedTransform::buildFilter(
Method & method,
const ColumnRawPtrs & columns,
const ColumnRawPtrs & clearing_hint_columns,
@@ -90,8 +86,8 @@ bool DistinctSortedBlockInputStream::buildFilter(
/// Compare last row of previous block and first row of current block,
/// If rows not equal, we can clear HashSet,
/// If clearing_hint_columns is empty, we CAN'T clear HashSet.
- if (!clearing_hint_columns.empty() && !prev_block.clearing_hint_columns.empty()
- && !rowsEqual(clearing_hint_columns, 0, prev_block.clearing_hint_columns, prev_block.block.rows() - 1))
+ if (!clearing_hint_columns.empty() && !prev_chunk.clearing_hint_columns.empty()
+ && !rowsEqual(clearing_hint_columns, 0, prev_chunk.clearing_hint_columns, prev_chunk.chunk.getNumRows() - 1))
{
method.data.clear();
}
@@ -117,18 +113,20 @@ bool DistinctSortedBlockInputStream::buildFilter(
return has_new_data;
}
-ColumnRawPtrs DistinctSortedBlockInputStream::getKeyColumns(const Block & block) const
+ColumnRawPtrs DistinctSortedTransform::getKeyColumns(const Chunk & chunk) const
{
- size_t columns = columns_names.empty() ? block.columns() : columns_names.size();
+ size_t columns = columns_names.empty() ? chunk.getNumColumns() : columns_names.size();
ColumnRawPtrs column_ptrs;
column_ptrs.reserve(columns);
for (size_t i = 0; i < columns; ++i)
{
- const auto & column = columns_names.empty()
- ? block.safeGetByPosition(i).column
- : block.getByName(columns_names[i]).column;
+ auto pos = i;
+ if (!columns_names.empty())
+ pos = input.getHeader().getPositionByName(columns_names[i]);
+
+ const auto & column = chunk.getColumns()[pos];
/// Ignore all constant columns.
if (!isColumnConst(*column))
@@ -138,13 +136,13 @@ ColumnRawPtrs DistinctSortedBlockInputStream::getKeyColumns(const Block & block)
return column_ptrs;
}
-ColumnRawPtrs DistinctSortedBlockInputStream::getClearingColumns(const Block & block, const ColumnRawPtrs & key_columns) const
+ColumnRawPtrs DistinctSortedTransform::getClearingColumns(const Chunk & chunk, const ColumnRawPtrs & key_columns) const
{
ColumnRawPtrs clearing_hint_columns;
clearing_hint_columns.reserve(description.size());
for (const auto & sort_column_description : description)
{
- const auto * sort_column_ptr = block.safeGetByPosition(sort_column_description.column_number).column.get();
+ const auto * sort_column_ptr = chunk.getColumns().at(sort_column_description.column_number).get();
const auto it = std::find(key_columns.cbegin(), key_columns.cend(), sort_column_ptr);
if (it != key_columns.cend()) /// if found in key_columns
clearing_hint_columns.emplace_back(sort_column_ptr);
@@ -154,7 +152,7 @@ ColumnRawPtrs DistinctSortedBlockInputStream::getClearingColumns(const Block & b
return clearing_hint_columns;
}
-bool DistinctSortedBlockInputStream::rowsEqual(const ColumnRawPtrs & lhs, size_t n, const ColumnRawPtrs & rhs, size_t m)
+bool DistinctSortedTransform::rowsEqual(const ColumnRawPtrs & lhs, size_t n, const ColumnRawPtrs & rhs, size_t m)
{
for (size_t column_index = 0, num_columns = lhs.size(); column_index < num_columns; ++column_index)
{
diff --git a/src/DataStreams/DistinctSortedBlockInputStream.h b/src/DataStreams/DistinctSortedBlockInputStream.h
index 146c9326e5d..ddac6c18a64 100644
--- a/src/DataStreams/DistinctSortedBlockInputStream.h
+++ b/src/DataStreams/DistinctSortedBlockInputStream.h
@@ -1,6 +1,6 @@
#pragma once
-#include
+#include
#include
#include
@@ -18,24 +18,22 @@ namespace DB
* set limit_hint to non zero value. So we stop emitting new rows after
* count of already emitted rows will reach the limit_hint.
*/
-class DistinctSortedBlockInputStream : public IBlockInputStream
+class DistinctSortedTransform : public ISimpleTransform
{
public:
/// Empty columns_ means all columns.
- DistinctSortedBlockInputStream(const BlockInputStreamPtr & input, SortDescription sort_description, const SizeLimits & set_size_limits_, UInt64 limit_hint_, const Names & columns);
+ DistinctSortedTransform(const Block & header, SortDescription sort_description, const SizeLimits & set_size_limits_, UInt64 limit_hint_, const Names & columns);
- String getName() const override { return "DistinctSorted"; }
-
- Block getHeader() const override { return children.at(0)->getHeader(); }
+ String getName() const override { return "DistinctSortedTransform"; }
protected:
- Block readImpl() override;
+ void transform(Chunk & chunk) override;
private:
- ColumnRawPtrs getKeyColumns(const Block & block) const;
+ ColumnRawPtrs getKeyColumns(const Chunk & chunk) const;
/// When clearing_columns changed, we can clean HashSet to memory optimization
/// clearing_columns is a left-prefix of SortDescription exists in key_columns
- ColumnRawPtrs getClearingColumns(const Block & block, const ColumnRawPtrs & key_columns) const;
+ ColumnRawPtrs getClearingColumns(const Chunk & chunk, const ColumnRawPtrs & key_columns) const;
static bool rowsEqual(const ColumnRawPtrs & lhs, size_t n, const ColumnRawPtrs & rhs, size_t m);
/// return true if has new data
@@ -50,12 +48,12 @@ private:
SortDescription description;
- struct PreviousBlock
+ struct PreviousChunk
{
- Block block;
+ Chunk chunk;
ColumnRawPtrs clearing_hint_columns;
};
- PreviousBlock prev_block;
+ PreviousChunk prev_chunk;
Names columns_names;
ClearableSetVariants data;
diff --git a/src/DataStreams/TTLBlockInputStream.cpp b/src/DataStreams/TTLBlockInputStream.cpp
index 05d4ba0a395..1a1484fc08e 100644
--- a/src/DataStreams/TTLBlockInputStream.cpp
+++ b/src/DataStreams/TTLBlockInputStream.cpp
@@ -16,18 +16,17 @@
namespace DB
{
-TTLBlockInputStream::TTLBlockInputStream(
- const BlockInputStreamPtr & input_,
+TTLTransform::TTLTransform(
+ const Block & header_,
const MergeTreeData & storage_,
const StorageMetadataPtr & metadata_snapshot_,
const MergeTreeData::MutableDataPartPtr & data_part_,
time_t current_time_,
bool force_)
- : data_part(data_part_)
- , log(&Poco::Logger::get(storage_.getLogName() + " (TTLBlockInputStream)"))
+ : ISimpleTransform(header_, header_, false)
+ , data_part(data_part_)
+ , log(&Poco::Logger::get(storage_.getLogName() + " (TTLTransform)"))
{
- children.push_back(input_);
- header = children.at(0)->getHeader();
auto old_ttl_infos = data_part->ttl_infos;
if (metadata_snapshot_->hasRowsTTL())
@@ -50,7 +49,7 @@ TTLBlockInputStream::TTLBlockInputStream(
for (const auto & group_by_ttl : metadata_snapshot_->getGroupByTTLs())
algorithms.emplace_back(std::make_unique(
- group_by_ttl, old_ttl_infos.group_by_ttl[group_by_ttl.result_column], current_time_, force_, header, storage_));
+ group_by_ttl, old_ttl_infos.group_by_ttl[group_by_ttl.result_column], current_time_, force_, getInputPort().getHeader(), storage_));
if (metadata_snapshot_->hasAnyColumnTTL())
{
@@ -98,22 +97,28 @@ Block reorderColumns(Block block, const Block & header)
return res;
}
-Block TTLBlockInputStream::readImpl()
+void TTLTransform::transform(Chunk & chunk)
{
if (all_data_dropped)
- return {};
+ {
+ stopReading();
+ chunk.clear();
+ return;
+ }
- auto block = children.at(0)->read();
+ auto block = getInputPort().getHeader().cloneWithColumns(chunk.detachColumns());
for (const auto & algorithm : algorithms)
algorithm->execute(block);
if (!block)
- return block;
+ return;
- return reorderColumns(std::move(block), header);
+ size_t num_rows = block.rows();
+
+ chunk = Chunk(reorderColumns(std::move(block), getOutputPort().getHeader()).getColumns(), num_rows);
}
-void TTLBlockInputStream::readSuffixImpl()
+void TTLTransform::finalize()
{
data_part->ttl_infos = {};
for (const auto & algorithm : algorithms)
@@ -126,4 +131,13 @@ void TTLBlockInputStream::readSuffixImpl()
}
}
+IProcessor::Status TTLTransform::prepare()
+{
+ auto status = ISimpleTransform::prepare();
+ if (status == Status::Finished)
+ finalize();
+
+ return status;
+}
+
}
diff --git a/src/DataStreams/TTLBlockInputStream.h b/src/DataStreams/TTLBlockInputStream.h
index bf854d9cc9c..986181df652 100644
--- a/src/DataStreams/TTLBlockInputStream.h
+++ b/src/DataStreams/TTLBlockInputStream.h
@@ -1,5 +1,5 @@
#pragma once
-#include
+#include
#include
#include
#include
@@ -12,11 +12,11 @@
namespace DB
{
-class TTLBlockInputStream : public IBlockInputStream
+class TTLTransform : public ISimpleTransform
{
public:
- TTLBlockInputStream(
- const BlockInputStreamPtr & input_,
+ TTLTransform(
+ const Block & header_,
const MergeTreeData & storage_,
const StorageMetadataPtr & metadata_snapshot_,
const MergeTreeData::MutableDataPartPtr & data_part_,
@@ -25,13 +25,14 @@ public:
);
String getName() const override { return "TTL"; }
- Block getHeader() const override { return header; }
+
+ Status prepare() override;
protected:
- Block readImpl() override;
+ void transform(Chunk & chunk) override;
/// Finalizes ttl infos and updates data part
- void readSuffixImpl() override;
+ void finalize();
private:
std::vector algorithms;
@@ -41,7 +42,6 @@ private:
/// ttl_infos and empty_columns are updating while reading
const MergeTreeData::MutableDataPartPtr & data_part;
Poco::Logger * log;
- Block header;
};
}
diff --git a/src/DataStreams/TTLCalcInputStream.cpp b/src/DataStreams/TTLCalcInputStream.cpp
index 2353e9ec259..c156b31428a 100644
--- a/src/DataStreams/TTLCalcInputStream.cpp
+++ b/src/DataStreams/TTLCalcInputStream.cpp
@@ -4,18 +4,17 @@
namespace DB
{
-TTLCalcInputStream::TTLCalcInputStream(
- const BlockInputStreamPtr & input_,
+TTLCalcTransform::TTLCalcTransform(
+ const Block & header_,
const MergeTreeData & storage_,
const StorageMetadataPtr & metadata_snapshot_,
const MergeTreeData::MutableDataPartPtr & data_part_,
time_t current_time_,
bool force_)
- : data_part(data_part_)
+ : ISimpleTransform(header_, header_, true)
+ , data_part(data_part_)
, log(&Poco::Logger::get(storage_.getLogName() + " (TTLCalcInputStream)"))
{
- children.push_back(input_);
- header = children.at(0)->getHeader();
auto old_ttl_infos = data_part->ttl_infos;
if (metadata_snapshot_->hasRowsTTL())
@@ -51,27 +50,36 @@ TTLCalcInputStream::TTLCalcInputStream(
recompression_ttl, TTLUpdateField::RECOMPRESSION_TTL, recompression_ttl.result_column, old_ttl_infos.recompression_ttl[recompression_ttl.result_column], current_time_, force_));
}
-Block TTLCalcInputStream::readImpl()
+void TTLCalcTransform::transform(Chunk & chunk)
{
- auto block = children.at(0)->read();
+ auto block = getInputPort().getHeader().cloneWithColumns(chunk.detachColumns());
for (const auto & algorithm : algorithms)
algorithm->execute(block);
if (!block)
- return block;
+ return;
- Block res;
- for (const auto & col : header)
- res.insert(block.getByName(col.name));
+ Chunk res;
+ for (const auto & col : getOutputPort().getHeader())
+ res.addColumn(block.getByName(col.name).column);
- return res;
+ chunk = std::move(res);
}
-void TTLCalcInputStream::readSuffixImpl()
+void TTLCalcTransform::finalize()
{
data_part->ttl_infos = {};
for (const auto & algorithm : algorithms)
algorithm->finalize(data_part);
}
+IProcessor::Status TTLCalcTransform::prepare()
+{
+ auto status = ISimpleTransform::prepare();
+ if (status == Status::Finished)
+ finalize();
+
+ return status;
+}
+
}
diff --git a/src/DataStreams/TTLCalcInputStream.h b/src/DataStreams/TTLCalcInputStream.h
index 20148eadfc2..d0e7b0055f2 100644
--- a/src/DataStreams/TTLCalcInputStream.h
+++ b/src/DataStreams/TTLCalcInputStream.h
@@ -1,5 +1,5 @@
#pragma once
-#include
+#include
#include
#include
#include
@@ -11,11 +11,11 @@
namespace DB
{
-class TTLCalcInputStream : public IBlockInputStream
+class TTLCalcTransform : public ISimpleTransform
{
public:
- TTLCalcInputStream(
- const BlockInputStreamPtr & input_,
+ TTLCalcTransform(
+ const Block & header_,
const MergeTreeData & storage_,
const StorageMetadataPtr & metadata_snapshot_,
const MergeTreeData::MutableDataPartPtr & data_part_,
@@ -24,13 +24,13 @@ public:
);
String getName() const override { return "TTL_CALC"; }
- Block getHeader() const override { return header; }
+ Status prepare() override;
protected:
- Block readImpl() override;
+ void transform(Chunk & chunk) override;
/// Finalizes ttl infos and updates data part
- void readSuffixImpl() override;
+ void finalize();
private:
std::vector algorithms;
@@ -38,7 +38,6 @@ private:
/// ttl_infos and empty_columns are updating while reading
const MergeTreeData::MutableDataPartPtr & data_part;
Poco::Logger * log;
- Block header;
};
}
diff --git a/src/Interpreters/MutationsInterpreter.cpp b/src/Interpreters/MutationsInterpreter.cpp
index 540d5c76c97..e5a129cbe12 100644
--- a/src/Interpreters/MutationsInterpreter.cpp
+++ b/src/Interpreters/MutationsInterpreter.cpp
@@ -932,7 +932,7 @@ void MutationsInterpreter::validate()
auto pipeline = addStreamsForLaterStages(stages, plan);
}
-BlockInputStreamPtr MutationsInterpreter::execute()
+QueryPipeline MutationsInterpreter::execute()
{
if (!can_execute)
throw Exception("Cannot execute mutations interpreter because can_execute flag set to false", ErrorCodes::LOGICAL_ERROR);
@@ -956,12 +956,11 @@ BlockInputStreamPtr MutationsInterpreter::execute()
}
auto pipeline = QueryPipelineBuilder::getPipeline(std::move(*builder));
- BlockInputStreamPtr result_stream = std::make_shared(std::move(pipeline));
if (!updated_header)
- updated_header = std::make_unique(result_stream->getHeader());
+ updated_header = std::make_unique(pipeline.getHeader());
- return result_stream;
+ return pipeline;
}
Block MutationsInterpreter::getUpdatedHeader() const
diff --git a/src/Interpreters/MutationsInterpreter.h b/src/Interpreters/MutationsInterpreter.h
index b0540f7d2ed..7b0ccb3bae5 100644
--- a/src/Interpreters/MutationsInterpreter.h
+++ b/src/Interpreters/MutationsInterpreter.h
@@ -50,7 +50,7 @@ public:
size_t evaluateCommandsSize();
/// The resulting stream will return blocks containing only changed columns and columns, that we need to recalculate indices.
- BlockInputStreamPtr execute();
+ QueryPipeline execute();
/// Only changed columns.
Block getUpdatedHeader() const;
diff --git a/src/Storages/MergeTree/MergeTask.cpp b/src/Storages/MergeTree/MergeTask.cpp
index e5fcaae3417..0810d45a805 100644
--- a/src/Storages/MergeTree/MergeTask.cpp
+++ b/src/Storages/MergeTree/MergeTask.cpp
@@ -11,6 +11,7 @@
#include "Storages/MergeTree/MergeTreeSequentialSource.h"
#include "Storages/MergeTree/FutureMergedMutatedPart.h"
#include "Processors/Transforms/ExpressionTransform.h"
+#include "Processors/Transforms/MaterializingTransform.h"
#include "Processors/Merges/MergingSortedTransform.h"
#include "Processors/Merges/CollapsingSortedTransform.h"
#include "Processors/Merges/SummingSortedTransform.h"
@@ -236,8 +237,6 @@ bool MergeTask::ExecuteAndFinalizeHorizontalPart::prepare()
ctx->compression_codec,
ctx->blocks_are_granules_size);
- global_ctx->merged_stream->readPrefix();
-
global_ctx->rows_written = 0;
ctx->initial_reservation = global_ctx->space_reservation ? global_ctx->space_reservation->getSize() : 0;
@@ -298,14 +297,17 @@ bool MergeTask::ExecuteAndFinalizeHorizontalPart::execute()
bool MergeTask::ExecuteAndFinalizeHorizontalPart::executeImpl()
{
Block block;
- if (!ctx->is_cancelled() && (block = global_ctx->merged_stream->read()))
+ if (!ctx->is_cancelled() && (global_ctx->merging_executor->pull(block)))
{
global_ctx->rows_written += block.rows();
const_cast(*global_ctx->to).write(block);
- global_ctx->merge_list_element_ptr->rows_written = global_ctx->merged_stream->getProfileInfo().rows;
- global_ctx->merge_list_element_ptr->bytes_written_uncompressed = global_ctx->merged_stream->getProfileInfo().bytes;
+ UInt64 result_rows = 0;
+ UInt64 result_bytes = 0;
+ global_ctx->merged_pipeline.tryGetResultRowsAndBytes(result_rows, result_bytes);
+ global_ctx->merge_list_element_ptr->rows_written = result_rows;
+ global_ctx->merge_list_element_ptr->bytes_written_uncompressed = result_bytes;
/// Reservation updates is not performed yet, during the merge it may lead to higher free space requirements
if (global_ctx->space_reservation && ctx->sum_input_rows_upper_bound)
@@ -323,8 +325,8 @@ bool MergeTask::ExecuteAndFinalizeHorizontalPart::executeImpl()
return true;
}
- global_ctx->merged_stream->readSuffix();
- global_ctx->merged_stream.reset();
+ global_ctx->merging_executor.reset();
+ global_ctx->merged_pipeline.reset();
if (global_ctx->merges_blocker->isCancelled())
throw Exception("Cancelled merging parts", ErrorCodes::ABORTED);
@@ -799,26 +801,25 @@ void MergeTask::ExecuteAndFinalizeHorizontalPart::createMergedStream()
auto res_pipe = Pipe::unitePipes(std::move(pipes));
res_pipe.addTransform(std::move(merged_transform));
- QueryPipeline pipeline(std::move(res_pipe));
- pipeline.setNumThreads(1);
-
- global_ctx->merged_stream = std::make_shared(std::move(pipeline));
if (global_ctx->deduplicate)
- global_ctx->merged_stream = std::make_shared(
- global_ctx->merged_stream, sort_description, SizeLimits(), 0 /*limit_hint*/, global_ctx->deduplicate_by_columns);
+ res_pipe.addTransform(std::make_shared(
+ res_pipe.getHeader(), sort_description, SizeLimits(), 0 /*limit_hint*/, global_ctx->deduplicate_by_columns));
if (ctx->need_remove_expired_values)
- global_ctx->merged_stream = std::make_shared(
- global_ctx->merged_stream, *global_ctx->data, global_ctx->metadata_snapshot, global_ctx->new_data_part, global_ctx->time_of_merge, ctx->force_ttl);
+ res_pipe.addTransform(std::make_shared(
+ res_pipe.getHeader(), *global_ctx->data, global_ctx->metadata_snapshot, global_ctx->new_data_part, global_ctx->time_of_merge, ctx->force_ttl));
if (global_ctx->metadata_snapshot->hasSecondaryIndices())
{
const auto & indices = global_ctx->metadata_snapshot->getSecondaryIndices();
- global_ctx->merged_stream = std::make_shared(
- global_ctx->merged_stream, indices.getSingleExpressionForIndices(global_ctx->metadata_snapshot->getColumns(), global_ctx->data->getContext()));
- global_ctx->merged_stream = std::make_shared(global_ctx->merged_stream);
+ res_pipe.addTransform(std::make_shared(
+ res_pipe.getHeader(), indices.getSingleExpressionForIndices(global_ctx->metadata_snapshot->getColumns(), global_ctx->data->getContext())));
+ res_pipe.addTransform(std::make_shared(res_pipe.getHeader()));
}
+
+ global_ctx->merged_pipeline = QueryPipeline(std::move(res_pipe));
+ global_ctx->merging_executor = std::make_unique(global_ctx->merged_pipeline);
}
diff --git a/src/Storages/MergeTree/MergeTask.h b/src/Storages/MergeTree/MergeTask.h
index ce628d831ae..aceca912cea 100644
--- a/src/Storages/MergeTree/MergeTask.h
+++ b/src/Storages/MergeTree/MergeTask.h
@@ -148,7 +148,8 @@ private:
std::unique_ptr column_progress{nullptr};
std::shared_ptr to{nullptr};
- BlockInputStreamPtr merged_stream{nullptr};
+ QueryPipeline merged_pipeline;
+ std::unique_ptr merging_executor;
SyncGuardPtr sync_guard{nullptr};
MergeTreeData::MutableDataPartPtr new_data_part{nullptr};
diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp
index 746f0c879d3..e38342e21dd 100644
--- a/src/Storages/MergeTree/MutateTask.cpp
+++ b/src/Storages/MergeTree/MutateTask.cpp
@@ -11,6 +11,9 @@
#include
#include
#include
+#include
+#include
+#include
#include
#include
#include
@@ -182,7 +185,7 @@ static std::vector getProjectionsForNewDataPart(
/// Return set of indices which should be recalculated during mutation also
/// wraps input stream into additional expression stream
static std::set getIndicesToRecalculate(
- BlockInputStreamPtr & input_stream,
+ QueryPipeline & pipeline,
const NameSet & updated_columns,
const StorageMetadataPtr & metadata_snapshot,
ContextPtr context,
@@ -234,9 +237,9 @@ static std::set getIndicesToRecalculate(
}
}
- if (!indices_to_recalc.empty() && input_stream)
+ if (!indices_to_recalc.empty() && pipeline.initialized())
{
- auto indices_recalc_syntax = TreeRewriter(context).analyze(indices_recalc_expr_list, input_stream->getHeader().getNamesAndTypesList());
+ auto indices_recalc_syntax = TreeRewriter(context).analyze(indices_recalc_expr_list, pipeline.getHeader().getNamesAndTypesList());
auto indices_recalc_expr = ExpressionAnalyzer(
indices_recalc_expr_list,
indices_recalc_syntax, context).getActions(false);
@@ -246,8 +249,11 @@ static std::set getIndicesToRecalculate(
/// MutationsInterpreter which knows about skip indices and stream 'in' already has
/// all required columns.
/// TODO move this logic to single place.
- input_stream = std::make_shared(
- std::make_shared(input_stream, indices_recalc_expr));
+ QueryPipelineBuilder builder;
+ builder.init(std::move(pipeline));
+ builder.addTransform(std::make_shared(builder.getHeader(), indices_recalc_expr));
+ builder.addTransform(std::make_shared(builder.getHeader()));
+ pipeline = QueryPipelineBuilder::getPipeline(std::move(builder));
}
return indices_to_recalc;
}
@@ -500,7 +506,8 @@ struct MutationContext
std::unique_ptr num_mutations;
- BlockInputStreamPtr mutating_stream{nullptr}; // in
+ QueryPipeline mutating_pipeline; // in
+ std::unique_ptr mutating_executor;
Block updated_header;
std::unique_ptr interpreter;
@@ -795,24 +802,25 @@ void PartMergerWriter::prepare()
bool PartMergerWriter::mutateOriginalPartAndPrepareProjections()
{
- if (MutationHelpers::checkOperationIsNotCanceled(*ctx->merges_blocker, ctx->mutate_entry) && (block = ctx->mutating_stream->read()))
+ Block cur_block;
+ if (MutationHelpers::checkOperationIsNotCanceled(*ctx->merges_blocker, ctx->mutate_entry) && ctx->mutating_executor->pull(cur_block))
{
if (ctx->minmax_idx)
- ctx->minmax_idx->update(block, ctx->data->getMinMaxColumnsNames(ctx->metadata_snapshot->getPartitionKey()));
+ ctx->minmax_idx->update(cur_block, ctx->data->getMinMaxColumnsNames(ctx->metadata_snapshot->getPartitionKey()));
- ctx->out->write(block);
+ ctx->out->write(cur_block);
for (size_t i = 0, size = ctx->projections_to_build.size(); i < size; ++i)
{
const auto & projection = *ctx->projections_to_build[i];
- auto projection_block = projection_squashes[i].add(projection.calculate(block, ctx->context));
+ auto projection_block = projection_squashes[i].add(projection.calculate(cur_block, ctx->context));
if (projection_block)
projection_parts[projection.name].emplace_back(MergeTreeDataWriter::writeTempProjectionPart(
*ctx->data, ctx->log, projection_block, projection, ctx->new_data_part.get(), ++block_num));
}
- (*ctx->mutate_entry)->rows_written += block.rows();
- (*ctx->mutate_entry)->bytes_written_uncompressed += block.bytes();
+ (*ctx->mutate_entry)->rows_written += cur_block.rows();
+ (*ctx->mutate_entry)->bytes_written_uncompressed += cur_block.bytes();
/// Need execute again
return true;
@@ -937,18 +945,25 @@ private:
auto skip_part_indices = MutationHelpers::getIndicesForNewDataPart(ctx->metadata_snapshot->getSecondaryIndices(), ctx->for_file_renames);
ctx->projections_to_build = MutationHelpers::getProjectionsForNewDataPart(ctx->metadata_snapshot->getProjections(), ctx->for_file_renames);
- if (ctx->mutating_stream == nullptr)
+ if (!ctx->mutating_pipeline.initialized())
throw Exception("Cannot mutate part columns with uninitialized mutations stream. It's a bug", ErrorCodes::LOGICAL_ERROR);
+ QueryPipelineBuilder builder;
+ builder.init(std::move(ctx->mutating_pipeline));
+
if (ctx->metadata_snapshot->hasPrimaryKey() || ctx->metadata_snapshot->hasSecondaryIndices())
- ctx->mutating_stream = std::make_shared(
- std::make_shared(ctx->mutating_stream, ctx->data->getPrimaryKeyAndSkipIndicesExpression(ctx->metadata_snapshot)));
+ {
+ builder.addTransform(
+ std::make_shared(builder.getHeader(), ctx->data->getPrimaryKeyAndSkipIndicesExpression(ctx->metadata_snapshot)));
+
+ builder.addTransform(std::make_shared(builder.getHeader()));
+ }
if (ctx->execute_ttl_type == ExecuteTTLType::NORMAL)
- ctx->mutating_stream = std::make_shared(ctx->mutating_stream, *ctx->data, ctx->metadata_snapshot, ctx->new_data_part, ctx->time_of_mutation, true);
+ builder.addTransform(std::make_shared(builder.getHeader(), *ctx->data, ctx->metadata_snapshot, ctx->new_data_part, ctx->time_of_mutation, true));
if (ctx->execute_ttl_type == ExecuteTTLType::RECALCULATE)
- ctx->mutating_stream = std::make_shared(ctx->mutating_stream, *ctx->data, ctx->metadata_snapshot, ctx->new_data_part, ctx->time_of_mutation, true);
+ builder.addTransform(std::make_shared(builder.getHeader(), *ctx->data, ctx->metadata_snapshot, ctx->new_data_part, ctx->time_of_mutation, true));
ctx->minmax_idx = std::make_shared();
@@ -959,7 +974,8 @@ private:
skip_part_indices,
ctx->compression_codec);
- ctx->mutating_stream->readPrefix();
+ ctx->mutating_pipeline = QueryPipelineBuilder::getPipeline(std::move(builder));
+ ctx->mutating_executor = std::make_unique(ctx->mutating_pipeline);
part_merger_writer_task = std::make_unique(ctx);
}
@@ -968,7 +984,8 @@ private:
void finalize()
{
ctx->new_data_part->minmax_idx = std::move(ctx->minmax_idx);
- ctx->mutating_stream->readSuffix();
+ ctx->mutating_executor.reset();
+ ctx->mutating_pipeline.reset();
static_pointer_cast(ctx->out)->writeSuffixAndFinalizePart(ctx->new_data_part, ctx->need_sync);
}
@@ -1087,16 +1104,16 @@ private:
ctx->compression_codec = ctx->source_part->default_codec;
- if (ctx->mutating_stream)
+ if (ctx->mutating_pipeline.initialized())
{
- if (ctx->mutating_stream == nullptr)
- throw Exception("Cannot mutate part columns with uninitialized mutations stream. It's a bug", ErrorCodes::LOGICAL_ERROR);
+ QueryPipelineBuilder builder;
+ builder.init(std::move(ctx->mutating_pipeline));
if (ctx->execute_ttl_type == ExecuteTTLType::NORMAL)
- ctx->mutating_stream = std::make_shared(ctx->mutating_stream, *ctx->data, ctx->metadata_snapshot, ctx->new_data_part, ctx->time_of_mutation, true);
+ builder.addTransform(std::make_shared(builder.getHeader(), *ctx->data, ctx->metadata_snapshot, ctx->new_data_part, ctx->time_of_mutation, true));
if (ctx->execute_ttl_type == ExecuteTTLType::RECALCULATE)
- ctx->mutating_stream = std::make_shared(ctx->mutating_stream, *ctx->data, ctx->metadata_snapshot, ctx->new_data_part, ctx->time_of_mutation, true);
+ builder.addTransform(std::make_shared(builder.getHeader(), *ctx->data, ctx->metadata_snapshot, ctx->new_data_part, ctx->time_of_mutation, true));
ctx->out = std::make_shared(
ctx->new_data_part,
@@ -1109,7 +1126,9 @@ private:
&ctx->source_part->index_granularity_info
);
- ctx->mutating_stream->readPrefix();
+ ctx->mutating_pipeline = QueryPipelineBuilder::getPipeline(std::move(builder));
+ ctx->mutating_executor = std::make_unique(ctx->mutating_pipeline);
+
ctx->projections_to_build = std::vector{ctx->projections_to_recalc.begin(), ctx->projections_to_recalc.end()};
part_merger_writer_task = std::make_unique(ctx);
@@ -1119,9 +1138,10 @@ private:
void finalize()
{
- if (ctx->mutating_stream)
+ if (ctx->mutating_executor)
{
- ctx->mutating_stream->readSuffix();
+ ctx->mutating_executor.reset();
+ ctx->mutating_pipeline.reset();
auto changed_checksums =
static_pointer_cast(ctx->out)->writeSuffixAndGetChecksums(
@@ -1267,9 +1287,9 @@ bool MutateTask::prepare()
ctx->materialized_indices = ctx->interpreter->grabMaterializedIndices();
ctx->materialized_projections = ctx->interpreter->grabMaterializedProjections();
ctx->mutation_kind = ctx->interpreter->getMutationKind();
- ctx->mutating_stream = ctx->interpreter->execute();
+ ctx->mutating_pipeline = ctx->interpreter->execute();
ctx->updated_header = ctx->interpreter->getUpdatedHeader();
- ctx->mutating_stream->setProgressCallback(MergeProgressCallback((*ctx->mutate_entry)->ptr(), ctx->watch_prev_elapsed, *ctx->stage_progress));
+ ctx->mutating_pipeline.setProgressCallback(MergeProgressCallback((*ctx->mutate_entry)->ptr(), ctx->watch_prev_elapsed, *ctx->stage_progress));
}
ctx->single_disk_volume = std::make_shared("volume_" + ctx->future_part->name, ctx->space_reservation->getDisk(), 0);
@@ -1299,7 +1319,7 @@ bool MutateTask::prepare()
ctx->need_sync = needSyncPart(ctx->source_part->rows_count, ctx->source_part->getBytesOnDisk(), *data_settings);
ctx->execute_ttl_type = ExecuteTTLType::NONE;
- if (ctx->mutating_stream)
+ if (ctx->mutating_pipeline.initialized())
ctx->execute_ttl_type = MergeTreeDataMergerMutator::shouldExecuteTTL(ctx->metadata_snapshot, ctx->interpreter->getColumnDependencies());
@@ -1318,7 +1338,7 @@ bool MutateTask::prepare()
ctx->updated_columns.emplace(name_type.name);
ctx->indices_to_recalc = MutationHelpers::getIndicesToRecalculate(
- ctx->mutating_stream, ctx->updated_columns, ctx->metadata_snapshot, ctx->context, ctx->materialized_indices, ctx->source_part);
+ ctx->mutating_pipeline, ctx->updated_columns, ctx->metadata_snapshot, ctx->context, ctx->materialized_indices, ctx->source_part);
ctx->projections_to_recalc = MutationHelpers::getProjectionsToRecalculate(
ctx->updated_columns, ctx->metadata_snapshot, ctx->materialized_projections, ctx->source_part);
diff --git a/src/Storages/StorageJoin.cpp b/src/Storages/StorageJoin.cpp
index e45183591f2..2acdba18c2d 100644
--- a/src/Storages/StorageJoin.cpp
+++ b/src/Storages/StorageJoin.cpp
@@ -18,6 +18,7 @@
#include
#include
#include
+#include
#include /// toLower
@@ -114,17 +115,16 @@ void StorageJoin::mutate(const MutationCommands & commands, ContextPtr context)
{
auto storage_ptr = DatabaseCatalog::instance().getTable(getStorageID(), context);
auto interpreter = std::make_unique(storage_ptr, metadata_snapshot, commands, context, true);
- auto in = interpreter->execute();
- in->readPrefix();
+ auto pipeline = interpreter->execute();
+ PullingPipelineExecutor executor(pipeline);
- while (const Block & block = in->read())
+ Block block;
+ while (executor.pull(block))
{
new_data->addJoinedBlock(block, true);
if (persistent)
backup_stream.write(block);
}
-
- in->readSuffix();
}
/// Now acquire exclusive lock and modify storage.
diff --git a/src/Storages/StorageMemory.cpp b/src/Storages/StorageMemory.cpp
index 3fe6083ab13..299e39a3836 100644
--- a/src/Storages/StorageMemory.cpp
+++ b/src/Storages/StorageMemory.cpp
@@ -10,6 +10,7 @@
#include
#include
#include
+#include
namespace DB
@@ -263,11 +264,12 @@ void StorageMemory::mutate(const MutationCommands & commands, ContextPtr context
new_context->setSetting("max_threads", 1);
auto interpreter = std::make_unique(storage_ptr, metadata_snapshot, commands, new_context, true);
- auto in = interpreter->execute();
+ auto pipeline = interpreter->execute();
+ PullingPipelineExecutor executor(pipeline);
- in->readPrefix();
Blocks out;
- while (Block block = in->read())
+ Block block;
+ while (executor.pull(block))
{
if (compress)
for (auto & elem : block)
@@ -275,7 +277,6 @@ void StorageMemory::mutate(const MutationCommands & commands, ContextPtr context
out.push_back(block);
}
- in->readSuffix();
std::unique_ptr new_data;
From 2bfcdc431b4f15d6f3610745db164b3296ecb8e8 Mon Sep 17 00:00:00 2001
From: Tatiana Kirillova
Date: Wed, 6 Oct 2021 21:42:07 +0300
Subject: [PATCH 035/104] translate
---
docs/en/operations/settings/settings.md | 4 +--
.../statements/select/group-by.md | 2 ++
.../statements/select/limit-by.md | 3 ++
.../statements/select/order-by.md | 4 ++-
docs/ru/operations/settings/settings.md | 36 +++++++++++++++++++
.../statements/select/group-by.md | 2 ++
.../sql-reference/statements/select/index.md | 3 +-
.../statements/select/limit-by.md | 2 ++
.../statements/select/order-by.md | 4 ++-
9 files changed, 54 insertions(+), 6 deletions(-)
diff --git a/docs/en/operations/settings/settings.md b/docs/en/operations/settings/settings.md
index fa4b96b8fbc..7868dfaaf79 100644
--- a/docs/en/operations/settings/settings.md
+++ b/docs/en/operations/settings/settings.md
@@ -3756,8 +3756,8 @@ Enables or disables supporting positional arguments for [GROUP BY](../../sql-ref
Possible values:
-- 0 — Disabled.
-- 1 — Enabled.
+- 1 — Column numbers can use instead of column names.
+- 0 — Positional arguments aren't supported.
Default value: `0`.
diff --git a/docs/en/sql-reference/statements/select/group-by.md b/docs/en/sql-reference/statements/select/group-by.md
index 7c2d3a20f43..26dd51d806d 100644
--- a/docs/en/sql-reference/statements/select/group-by.md
+++ b/docs/en/sql-reference/statements/select/group-by.md
@@ -10,6 +10,8 @@ toc_title: GROUP BY
- All the expressions in the [SELECT](../../../sql-reference/statements/select/index.md), [HAVING](../../../sql-reference/statements/select/having.md), and [ORDER BY](../../../sql-reference/statements/select/order-by.md) clauses **must** be calculated based on key expressions **or** on [aggregate functions](../../../sql-reference/aggregate-functions/index.md) over non-key expressions (including plain columns). In other words, each column selected from the table must be used either in a key expression or inside an aggregate function, but not both.
- Result of aggregating `SELECT` query will contain as many rows as there were unique values of “grouping key” in source table. Usually this signficantly reduces the row count, often by orders of magnitude, but not necessarily: row count stays the same if all “grouping key” values were distinct.
+When you want to group data in the table by column numbers instead of column names, enable the setting [enable_positional_arguments](../../../operations/settings/settings.md#enable-positional-arguments).
+
!!! note "Note"
There’s an additional way to run aggregation over a table. If a query contains table columns only inside aggregate functions, the `GROUP BY clause` can be omitted, and aggregation by an empty set of keys is assumed. Such queries always return exactly one row.
diff --git a/docs/en/sql-reference/statements/select/limit-by.md b/docs/en/sql-reference/statements/select/limit-by.md
index 34645b68b03..e13c46e0c29 100644
--- a/docs/en/sql-reference/statements/select/limit-by.md
+++ b/docs/en/sql-reference/statements/select/limit-by.md
@@ -16,6 +16,9 @@ During query processing, ClickHouse selects data ordered by sorting key. The sor
!!! note "Note"
`LIMIT BY` is not related to [LIMIT](../../../sql-reference/statements/select/limit.md). They can both be used in the same query.
+If you want to use column numbers instead of column names in the `LIMIT BY` clause, enable setting [enable_positional_arguments](../../../operations/settings/settings.md#enable-positional-arguments).
+
+
## Examples {#examples}
Sample table:
diff --git a/docs/en/sql-reference/statements/select/order-by.md b/docs/en/sql-reference/statements/select/order-by.md
index 030f04d5e83..8a281a8c16f 100644
--- a/docs/en/sql-reference/statements/select/order-by.md
+++ b/docs/en/sql-reference/statements/select/order-by.md
@@ -4,7 +4,9 @@ toc_title: ORDER BY
# ORDER BY Clause {#select-order-by}
-The `ORDER BY` clause contains a list of expressions, which can each be attributed with `DESC` (descending) or `ASC` (ascending) modifier which determine the sorting direction. If the direction is not specified, `ASC` is assumed, so it’s usually omitted. The sorting direction applies to a single expression, not to the entire list. Example: `ORDER BY Visits DESC, SearchPhrase`
+The `ORDER BY` clause contains a list of expressions, which can each be attributed with `DESC` (descending) or `ASC` (ascending) modifier which determine the sorting direction. If the direction is not specified, `ASC` is assumed, so it’s usually omitted. The sorting direction applies to a single expression, not to the entire list. Example: `ORDER BY Visits DESC, SearchPhrase`.
+
+If you want to sort by column numbers instead of column names, set `enable_positional_arguments = 1`.
Rows that have identical values for the list of sorting expressions are output in an arbitrary order, which can also be non-deterministic (different each time).
If the ORDER BY clause is omitted, the order of the rows is also undefined, and may be non-deterministic as well.
diff --git a/docs/ru/operations/settings/settings.md b/docs/ru/operations/settings/settings.md
index e639c0a0df2..430a26f71d1 100644
--- a/docs/ru/operations/settings/settings.md
+++ b/docs/ru/operations/settings/settings.md
@@ -3538,3 +3538,39 @@ Exception: Total regexp lengths too large.
**См. также**
- [max_hyperscan_regexp_length](#max-hyperscan-regexp-length)
+
+## enable_positional_arguments {#enable-positional-arguments}
+
+Включает и отключает поддержку позиционных аргументов для [GROUP BY](../../sql-reference/statements/select/group-by.md), [LIMIT BY](../../sql-reference/statements/select/limit-by.md), [ORDER BY](../../sql-reference/statements/select/order-by.md). Если вы хотите использовать номера столбцов вместо названий в выражениях этих операторов, установите `enable_positional_arguments = 1`.
+
+Возможные значения:
+
+- 1 — Можно использовать номера столбцов вместо названий столбцов.
+- 0 — Позиционные аргументы не поддерживаются.
+
+Значение по умолчанию: `0`.
+
+**Пример**
+
+Запрос:
+
+```sql
+CREATE TABLE positional_arguments(one Int, two Int, three Int) ENGINE=Memory();
+
+INSERT INTO positional_arguments VALUES (10, 20, 30), (20, 20, 10), (30, 10, 20);
+
+SET enable_positional_arguments = 1;
+
+SELECT * FROM positional_arguments ORDER BY 2,3;
+```
+
+Результат:
+
+```text
+┌─one─┬─two─┬─three─┐
+│ 30 │ 10 │ 20 │
+│ 20 │ 20 │ 10 │
+│ 10 │ 20 │ 30 │
+└─────┴─────┴───────┘
+
+```
\ No newline at end of file
diff --git a/docs/ru/sql-reference/statements/select/group-by.md b/docs/ru/sql-reference/statements/select/group-by.md
index 2f0cabd14fb..ac06636e79f 100644
--- a/docs/ru/sql-reference/statements/select/group-by.md
+++ b/docs/ru/sql-reference/statements/select/group-by.md
@@ -10,6 +10,8 @@ toc_title: GROUP BY
- Все выражения в секциях [SELECT](index.md), [HAVING](having.md), и [ORDER BY](order-by.md) статьи **должны** быть вычисленными на основе ключевых выражений **или** на [агрегатных функций](../../../sql-reference/aggregate-functions/index.md) над неключевыми выражениями (включая столбцы). Другими словами, каждый столбец, выбранный из таблицы, должен использоваться либо в ключевом выражении, либо внутри агрегатной функции, но не в обоих.
- В результате агрегирования `SELECT` запрос будет содержать столько строк, сколько было уникальных значений ключа группировки в исходной таблице. Обычно агрегация значительно уменьшает количество строк, часто на порядки, но не обязательно: количество строк остается неизменным, если все исходные значения ключа группировки ценности были различны.
+Если вы хотите группировать данные в таблице по номерам столбцов, а не по названиям, включите настройку [enable_positional_arguments](../../../operations/settings/settings.md#enable-positional-arguments).
+
!!! note "Примечание"
Есть ещё один способ запустить агрегацию по таблице. Если запрос содержит столбцы исходной таблицы только внутри агрегатных функций, то `GROUP BY` секцию можно опустить, и предполагается агрегирование по пустому набору ключей. Такие запросы всегда возвращают ровно одну строку.
diff --git a/docs/ru/sql-reference/statements/select/index.md b/docs/ru/sql-reference/statements/select/index.md
index c2820bc7be4..f4e8a3a24b0 100644
--- a/docs/ru/sql-reference/statements/select/index.md
+++ b/docs/ru/sql-reference/statements/select/index.md
@@ -140,8 +140,7 @@ Code: 42. DB::Exception: Received from localhost:9000. DB::Exception: Number of
Вы можете использовать синонимы (алиасы `AS`) в любом месте запроса.
-В секциях `GROUP BY`, `ORDER BY`, в отличие от диалекта MySQL, и в соответствии со стандартным SQL, не поддерживаются позиционные аргументы.
-Например, если вы напишите `GROUP BY 1, 2` - то это будет воспринято, как группировка по константам (то есть, агрегация всех строк в одну).
+В секциях `GROUP BY`, `ORDER BY` и `LIMIT BY` поддерживаются позиционные аргументы. Например, если вы напишите `ORDER BY 1,2` - будет выполнена сортировка сначала по первому, а затем по второму столбцу.
## Детали реализации {#implementation-details}
diff --git a/docs/ru/sql-reference/statements/select/limit-by.md b/docs/ru/sql-reference/statements/select/limit-by.md
index fba81c023b5..861d88dcafb 100644
--- a/docs/ru/sql-reference/statements/select/limit-by.md
+++ b/docs/ru/sql-reference/statements/select/limit-by.md
@@ -15,6 +15,8 @@ ClickHouse поддерживает следующий синтаксис:
`LIMIT BY` не связана с секцией `LIMIT`. Их можно использовать в одном запросе.
+Если вы хотите использовать в секции `LIMIT BY` номера столбцов вместо названий, включите настройку [enable_positional_arguments](../../../operations/settings/settings.md#enable-positional-arguments).
+
## Примеры
Образец таблицы:
diff --git a/docs/ru/sql-reference/statements/select/order-by.md b/docs/ru/sql-reference/statements/select/order-by.md
index d7d2e9c7574..fca5653d0bc 100644
--- a/docs/ru/sql-reference/statements/select/order-by.md
+++ b/docs/ru/sql-reference/statements/select/order-by.md
@@ -4,7 +4,9 @@ toc_title: ORDER BY
# Секция ORDER BY {#select-order-by}
-Секция `ORDER BY` содержит список выражений, к каждому из которых также может быть приписано `DESC` или `ASC` (направление сортировки). Если ничего не приписано - это аналогично приписыванию `ASC`. `ASC` - сортировка по возрастанию, `DESC` - сортировка по убыванию. Обозначение направления сортировки действует на одно выражение, а не на весь список. Пример: `ORDER BY Visits DESC, SearchPhrase`
+Секция `ORDER BY` содержит список выражений, к каждому из которых также может быть приписано `DESC` или `ASC` (направление сортировки). Если ничего не приписано - это аналогично приписыванию `ASC`. `ASC` - сортировка по возрастанию, `DESC` - сортировка по убыванию. Обозначение направления сортировки действует на одно выражение, а не на весь список. Пример: `ORDER BY Visits DESC, SearchPhrase`.
+
+Если вы хотите сортировать данные по номерам столбцов, а не по названиям, установите настройку `enable_positional_arguments = 1`.
Строки, для которых список выражений, по которым производится сортировка, принимает одинаковые значения, выводятся в произвольном порядке, который может быть также недетерминированным (каждый раз разным).
Если секция ORDER BY отсутствует, то, аналогично, порядок, в котором идут строки, не определён, и может быть недетерминированным.
From 88c4a9030cd47f3e595bc6b4c2c33655a1206eb0 Mon Sep 17 00:00:00 2001
From: Tatiana Kirillova
Date: Thu, 7 Oct 2021 08:25:44 +0300
Subject: [PATCH 036/104] Update docs/en/operations/settings/settings.md
Co-authored-by: olgarev <56617294+olgarev@users.noreply.github.com>
---
docs/en/operations/settings/settings.md | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/docs/en/operations/settings/settings.md b/docs/en/operations/settings/settings.md
index 7868dfaaf79..ff0ce28a5ba 100644
--- a/docs/en/operations/settings/settings.md
+++ b/docs/en/operations/settings/settings.md
@@ -3756,8 +3756,8 @@ Enables or disables supporting positional arguments for [GROUP BY](../../sql-ref
Possible values:
-- 1 — Column numbers can use instead of column names.
- 0 — Positional arguments aren't supported.
+- 1 — Positional arguments are supported: column numbers can be used instead of column names.
Default value: `0`.
From 21197e1820f9c9e7b43b606dc8e4c0fc7f0a4d7d Mon Sep 17 00:00:00 2001
From: Tatiana Kirillova
Date: Thu, 7 Oct 2021 08:26:07 +0300
Subject: [PATCH 037/104] Update docs/en/operations/settings/settings.md
Co-authored-by: olgarev <56617294+olgarev@users.noreply.github.com>
---
docs/en/operations/settings/settings.md | 1 -
1 file changed, 1 deletion(-)
diff --git a/docs/en/operations/settings/settings.md b/docs/en/operations/settings/settings.md
index ff0ce28a5ba..f78fbc8a2bc 100644
--- a/docs/en/operations/settings/settings.md
+++ b/docs/en/operations/settings/settings.md
@@ -3783,5 +3783,4 @@ Result:
│ 20 │ 20 │ 10 │
│ 10 │ 20 │ 30 │
└─────┴─────┴───────┘
-
```
\ No newline at end of file
From c70ce36ff40a75b031922f0d06e05194bd4587f5 Mon Sep 17 00:00:00 2001
From: Tatiana Kirillova
Date: Thu, 7 Oct 2021 08:27:00 +0300
Subject: [PATCH 038/104] Update
docs/en/sql-reference/statements/select/index.md
Co-authored-by: olgarev <56617294+olgarev@users.noreply.github.com>
---
docs/en/sql-reference/statements/select/index.md | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/docs/en/sql-reference/statements/select/index.md b/docs/en/sql-reference/statements/select/index.md
index e31ba6b1f4b..0427764475a 100644
--- a/docs/en/sql-reference/statements/select/index.md
+++ b/docs/en/sql-reference/statements/select/index.md
@@ -144,7 +144,7 @@ Extreme values are calculated for rows before `LIMIT`, but after `LIMIT BY`. How
You can use synonyms (`AS` aliases) in any part of a query.
-The `GROUP BY`, `ORDER BY`, and `LIMIT BY` clauses support positional arguments. For example, `ORDER BY 1,2` will be sorting rows in the table on the first and then the second column.
+The `GROUP BY`, `ORDER BY`, and `LIMIT BY` clauses can support positional arguments. To enable this, switch on the [enable_positional_arguments](../../../operations/settings/settings.md#enable-positional-arguments) setting. Then, for example, `ORDER BY 1,2` will sort rows in the table by the first and then the second column.
## Implementation Details {#implementation-details}
From 0ed02e689dc939939d95b2adccb3a0be8028237c Mon Sep 17 00:00:00 2001
From: Tatiana Kirillova
Date: Thu, 7 Oct 2021 08:27:17 +0300
Subject: [PATCH 039/104] Update
docs/en/sql-reference/statements/select/limit-by.md
Co-authored-by: olgarev <56617294+olgarev@users.noreply.github.com>
---
docs/en/sql-reference/statements/select/limit-by.md | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/docs/en/sql-reference/statements/select/limit-by.md b/docs/en/sql-reference/statements/select/limit-by.md
index e13c46e0c29..e1ca58cdec8 100644
--- a/docs/en/sql-reference/statements/select/limit-by.md
+++ b/docs/en/sql-reference/statements/select/limit-by.md
@@ -16,7 +16,7 @@ During query processing, ClickHouse selects data ordered by sorting key. The sor
!!! note "Note"
`LIMIT BY` is not related to [LIMIT](../../../sql-reference/statements/select/limit.md). They can both be used in the same query.
-If you want to use column numbers instead of column names in the `LIMIT BY` clause, enable setting [enable_positional_arguments](../../../operations/settings/settings.md#enable-positional-arguments).
+If you want to use column numbers instead of column names in the `LIMIT BY` clause, enable the setting [enable_positional_arguments](../../../operations/settings/settings.md#enable-positional-arguments).
## Examples {#examples}
From 5aef3e761792a2bf4d60e6ad81d6d8a26e8f7f49 Mon Sep 17 00:00:00 2001
From: Tatiana Kirillova
Date: Thu, 7 Oct 2021 08:27:30 +0300
Subject: [PATCH 040/104] Update docs/ru/operations/settings/settings.md
Co-authored-by: olgarev <56617294+olgarev@users.noreply.github.com>
---
docs/ru/operations/settings/settings.md | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/docs/ru/operations/settings/settings.md b/docs/ru/operations/settings/settings.md
index 430a26f71d1..50376b64e5e 100644
--- a/docs/ru/operations/settings/settings.md
+++ b/docs/ru/operations/settings/settings.md
@@ -3545,8 +3545,8 @@ Exception: Total regexp lengths too large.
Возможные значения:
-- 1 — Можно использовать номера столбцов вместо названий столбцов.
- 0 — Позиционные аргументы не поддерживаются.
+- 1 — Позиционные аргументы поддерживаются: можно использовать номера столбцов вместо названий столбцов.
Значение по умолчанию: `0`.
From f3e0edd9a98cc97f332d1a51a32699c6bd55348d Mon Sep 17 00:00:00 2001
From: Tatiana Kirillova
Date: Thu, 7 Oct 2021 08:27:40 +0300
Subject: [PATCH 041/104] Update docs/ru/operations/settings/settings.md
Co-authored-by: olgarev <56617294+olgarev@users.noreply.github.com>
---
docs/ru/operations/settings/settings.md | 1 -
1 file changed, 1 deletion(-)
diff --git a/docs/ru/operations/settings/settings.md b/docs/ru/operations/settings/settings.md
index 50376b64e5e..500485aea2f 100644
--- a/docs/ru/operations/settings/settings.md
+++ b/docs/ru/operations/settings/settings.md
@@ -3572,5 +3572,4 @@ SELECT * FROM positional_arguments ORDER BY 2,3;
│ 20 │ 20 │ 10 │
│ 10 │ 20 │ 30 │
└─────┴─────┴───────┘
-
```
\ No newline at end of file
From 6b927f1bda3ebefe819ccb9db4b119e0b60065d6 Mon Sep 17 00:00:00 2001
From: Tatiana Kirillova
Date: Thu, 7 Oct 2021 08:28:10 +0300
Subject: [PATCH 042/104] Update
docs/ru/sql-reference/statements/select/group-by.md
Co-authored-by: olgarev <56617294+olgarev@users.noreply.github.com>
---
docs/ru/sql-reference/statements/select/group-by.md | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/docs/ru/sql-reference/statements/select/group-by.md b/docs/ru/sql-reference/statements/select/group-by.md
index ac06636e79f..8bc1b765ad3 100644
--- a/docs/ru/sql-reference/statements/select/group-by.md
+++ b/docs/ru/sql-reference/statements/select/group-by.md
@@ -10,7 +10,7 @@ toc_title: GROUP BY
- Все выражения в секциях [SELECT](index.md), [HAVING](having.md), и [ORDER BY](order-by.md) статьи **должны** быть вычисленными на основе ключевых выражений **или** на [агрегатных функций](../../../sql-reference/aggregate-functions/index.md) над неключевыми выражениями (включая столбцы). Другими словами, каждый столбец, выбранный из таблицы, должен использоваться либо в ключевом выражении, либо внутри агрегатной функции, но не в обоих.
- В результате агрегирования `SELECT` запрос будет содержать столько строк, сколько было уникальных значений ключа группировки в исходной таблице. Обычно агрегация значительно уменьшает количество строк, часто на порядки, но не обязательно: количество строк остается неизменным, если все исходные значения ключа группировки ценности были различны.
-Если вы хотите группировать данные в таблице по номерам столбцов, а не по названиям, включите настройку [enable_positional_arguments](../../../operations/settings/settings.md#enable-positional-arguments).
+Если вы хотите для группировки данных в таблице указывать номера столбцов, а не названия, включите настройку [enable_positional_arguments](../../../operations/settings/settings.md#enable-positional-arguments).
!!! note "Примечание"
Есть ещё один способ запустить агрегацию по таблице. Если запрос содержит столбцы исходной таблицы только внутри агрегатных функций, то `GROUP BY` секцию можно опустить, и предполагается агрегирование по пустому набору ключей. Такие запросы всегда возвращают ровно одну строку.
From fc627bc096fc33ec1c5aae65e20be965136fa51d Mon Sep 17 00:00:00 2001
From: Tatiana Kirillova
Date: Thu, 7 Oct 2021 08:28:37 +0300
Subject: [PATCH 043/104] Update
docs/ru/sql-reference/statements/select/order-by.md
Co-authored-by: olgarev <56617294+olgarev@users.noreply.github.com>
---
docs/ru/sql-reference/statements/select/order-by.md | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/docs/ru/sql-reference/statements/select/order-by.md b/docs/ru/sql-reference/statements/select/order-by.md
index fca5653d0bc..190a46dacc9 100644
--- a/docs/ru/sql-reference/statements/select/order-by.md
+++ b/docs/ru/sql-reference/statements/select/order-by.md
@@ -6,7 +6,7 @@ toc_title: ORDER BY
Секция `ORDER BY` содержит список выражений, к каждому из которых также может быть приписано `DESC` или `ASC` (направление сортировки). Если ничего не приписано - это аналогично приписыванию `ASC`. `ASC` - сортировка по возрастанию, `DESC` - сортировка по убыванию. Обозначение направления сортировки действует на одно выражение, а не на весь список. Пример: `ORDER BY Visits DESC, SearchPhrase`.
-Если вы хотите сортировать данные по номерам столбцов, а не по названиям, установите настройку `enable_positional_arguments = 1`.
+Если вы хотите для сортировки данных указывать номера столбцов, а не названия, включите настройку [enable_positional_arguments](../../../operations/settings/settings.md#enable-positional-arguments).
Строки, для которых список выражений, по которым производится сортировка, принимает одинаковые значения, выводятся в произвольном порядке, который может быть также недетерминированным (каждый раз разным).
Если секция ORDER BY отсутствует, то, аналогично, порядок, в котором идут строки, не определён, и может быть недетерминированным.
From a96cae23244cccb77b3bf012aac9239221f5dd3f Mon Sep 17 00:00:00 2001
From: Tatiana Kirillova
Date: Thu, 7 Oct 2021 08:28:57 +0300
Subject: [PATCH 044/104] Update
docs/ru/sql-reference/statements/select/index.md
Co-authored-by: olgarev <56617294+olgarev@users.noreply.github.com>
---
docs/ru/sql-reference/statements/select/index.md | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/docs/ru/sql-reference/statements/select/index.md b/docs/ru/sql-reference/statements/select/index.md
index f4e8a3a24b0..ffaae74b1d9 100644
--- a/docs/ru/sql-reference/statements/select/index.md
+++ b/docs/ru/sql-reference/statements/select/index.md
@@ -140,7 +140,7 @@ Code: 42. DB::Exception: Received from localhost:9000. DB::Exception: Number of
Вы можете использовать синонимы (алиасы `AS`) в любом месте запроса.
-В секциях `GROUP BY`, `ORDER BY` и `LIMIT BY` поддерживаются позиционные аргументы. Например, если вы напишите `ORDER BY 1,2` - будет выполнена сортировка сначала по первому, а затем по второму столбцу.
+В секциях `GROUP BY`, `ORDER BY` и `LIMIT BY` можно использовать не названия столбцов, а номера. Для этого нужно включить настройку [enable_positional_arguments](../../../operations/settings/settings.md#enable-positional-arguments). Тогда, например, в запросе с `ORDER BY 1,2` будет выполнена сортировка сначала по первому, а затем по второму столбцу.
## Детали реализации {#implementation-details}
From 0362083843ed014f0ba58a026d60875fcf80bf07 Mon Sep 17 00:00:00 2001
From: Tatiana Kirillova
Date: Thu, 7 Oct 2021 08:29:28 +0300
Subject: [PATCH 045/104] Update
docs/en/sql-reference/statements/select/order-by.md
Co-authored-by: olgarev <56617294+olgarev@users.noreply.github.com>
---
docs/en/sql-reference/statements/select/order-by.md | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/docs/en/sql-reference/statements/select/order-by.md b/docs/en/sql-reference/statements/select/order-by.md
index 8a281a8c16f..ee6893812cc 100644
--- a/docs/en/sql-reference/statements/select/order-by.md
+++ b/docs/en/sql-reference/statements/select/order-by.md
@@ -6,7 +6,7 @@ toc_title: ORDER BY
The `ORDER BY` clause contains a list of expressions, which can each be attributed with `DESC` (descending) or `ASC` (ascending) modifier which determine the sorting direction. If the direction is not specified, `ASC` is assumed, so it’s usually omitted. The sorting direction applies to a single expression, not to the entire list. Example: `ORDER BY Visits DESC, SearchPhrase`.
-If you want to sort by column numbers instead of column names, set `enable_positional_arguments = 1`.
+If you want to sort by column numbers instead of column names, enable the setting [enable_positional_arguments](../../../operations/settings/settings.md#enable-positional-arguments).
Rows that have identical values for the list of sorting expressions are output in an arbitrary order, which can also be non-deterministic (different each time).
If the ORDER BY clause is omitted, the order of the rows is also undefined, and may be non-deterministic as well.
From 71cffbf521324ff2613d0e6b3fc2b6e4642fdc45 Mon Sep 17 00:00:00 2001
From: Azat Khuzhin
Date: Thu, 7 Oct 2021 10:51:03 +0300
Subject: [PATCH 046/104] Make memory_profiler_step API cleaner
Right now to configure memory_profiler_step/total_memory_profiler_step
you need to call:
MemoryTracker::setOrRaiseProfilerLimit()
MemoryTracker::setProfilerStep()
But it is easy to forget about setOrRaiseProfilerLimit(), since there are
not even any comments about this.
So instead, make setOrRaiseProfilerLimit() private and call it from
setProfilerStep()
---
programs/server/Server.cpp | 1 -
src/Common/MemoryTracker.h | 4 +++-
src/Interpreters/ProcessList.cpp | 1 -
src/Storages/MergeTree/MergeList.cpp | 1 -
4 files changed, 3 insertions(+), 4 deletions(-)
diff --git a/programs/server/Server.cpp b/programs/server/Server.cpp
index cd5d72cfba4..4ed5b114082 100644
--- a/programs/server/Server.cpp
+++ b/programs/server/Server.cpp
@@ -1159,7 +1159,6 @@ if (ThreadFuzzer::instance().isEffective())
UInt64 total_memory_profiler_step = config().getUInt64("total_memory_profiler_step", 0);
if (total_memory_profiler_step)
{
- total_memory_tracker.setOrRaiseProfilerLimit(total_memory_profiler_step);
total_memory_tracker.setProfilerStep(total_memory_profiler_step);
}
diff --git a/src/Common/MemoryTracker.h b/src/Common/MemoryTracker.h
index 36560fec334..8ca8e4a6455 100644
--- a/src/Common/MemoryTracker.h
+++ b/src/Common/MemoryTracker.h
@@ -61,6 +61,8 @@ private:
void updatePeak(Int64 will_be, bool log_memory_usage);
void logMemoryUsage(Int64 current) const;
+ void setOrRaiseProfilerLimit(Int64 value);
+
public:
explicit MemoryTracker(VariableContext level_ = VariableContext::Thread);
explicit MemoryTracker(MemoryTracker * parent_, VariableContext level_ = VariableContext::Thread);
@@ -106,7 +108,6 @@ public:
* Otherwise, set limit to new value, if new value is greater than previous limit.
*/
void setOrRaiseHardLimit(Int64 value);
- void setOrRaiseProfilerLimit(Int64 value);
void setFaultProbability(double value)
{
@@ -121,6 +122,7 @@ public:
void setProfilerStep(Int64 value)
{
profiler_step = value;
+ setOrRaiseProfilerLimit(value);
}
/// next should be changed only once: from nullptr to some value.
diff --git a/src/Interpreters/ProcessList.cpp b/src/Interpreters/ProcessList.cpp
index 8576f4662ec..f8402cf0287 100644
--- a/src/Interpreters/ProcessList.cpp
+++ b/src/Interpreters/ProcessList.cpp
@@ -203,7 +203,6 @@ ProcessList::EntryPtr ProcessList::insert(const String & query_, const IAST * as
if (query_context->hasTraceCollector())
{
/// Set up memory profiling
- thread_group->memory_tracker.setOrRaiseProfilerLimit(settings.memory_profiler_step);
thread_group->memory_tracker.setProfilerStep(settings.memory_profiler_step);
thread_group->memory_tracker.setSampleProbability(settings.memory_profiler_sample_probability);
}
diff --git a/src/Storages/MergeTree/MergeList.cpp b/src/Storages/MergeTree/MergeList.cpp
index cd2668988a8..07aabf64dfd 100644
--- a/src/Storages/MergeTree/MergeList.cpp
+++ b/src/Storages/MergeTree/MergeList.cpp
@@ -82,7 +82,6 @@ MergeListElement::MergeListElement(
memory_tracker.setDescription("Mutate/Merge");
memory_tracker.setProfilerStep(memory_profiler_step);
- memory_tracker.setOrRaiseProfilerLimit(memory_profiler_step);
memory_tracker.setSampleProbability(memory_profiler_sample_probability);
}
From 298f613557ceff080498b8f4fff6a2abb211051b Mon Sep 17 00:00:00 2001
From: Shoh Jahon <16575814+Shohjahon@users.noreply.github.com>
Date: Thu, 7 Oct 2021 14:59:23 +0500
Subject: [PATCH 047/104] Update fetchPostgreSQLTableStructure.cpp
Added relkind 'p' (partitioned tables) to the query that fetches the replica identity index @kssenii !
---
src/Databases/PostgreSQL/fetchPostgreSQLTableStructure.cpp | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/src/Databases/PostgreSQL/fetchPostgreSQLTableStructure.cpp b/src/Databases/PostgreSQL/fetchPostgreSQLTableStructure.cpp
index 4f5743035a7..5ac4180ec27 100644
--- a/src/Databases/PostgreSQL/fetchPostgreSQLTableStructure.cpp
+++ b/src/Databases/PostgreSQL/fetchPostgreSQLTableStructure.cpp
@@ -250,7 +250,7 @@ PostgreSQLTableStructure fetchPostgreSQLTableStructure(
"and i.oid = ix.indexrelid "
"and a.attrelid = t.oid "
"and a.attnum = ANY(ix.indkey) "
- "and t.relkind = 'r' " /// simple tables
+ "and t.relkind in ('r', 'p') " /// ordinary and partitioned tables
"and t.relname = {} " /// Connection is already done to a needed database, only table name is needed.
"and ix.indisreplident = 't' " /// index is replica identity index
"ORDER BY a.attname", /// column names
From 4119848a41512caf641c0f190d1caee245382a9f Mon Sep 17 00:00:00 2001
From: Alexander Tokmakov
Date: Wed, 6 Oct 2021 20:07:35 +0300
Subject: [PATCH 048/104] better diagnostic for OPTIMIZE
---
.../MergeTree/MergeTreeDataMergerMutator.cpp | 6 +
src/Storages/StorageReplicatedMergeTree.cpp | 200 ++++++++----------
2 files changed, 96 insertions(+), 110 deletions(-)
diff --git a/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp b/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp
index 9885a10cd62..b35a41d5d19 100644
--- a/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp
+++ b/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp
@@ -328,7 +328,11 @@ SelectPartsDecision MergeTreeDataMergerMutator::selectAllPartsToMergeWithinParti
MergeTreeData::DataPartsVector parts = selectAllPartsFromPartition(partition_id);
if (parts.empty())
+ {
+ if (out_disable_reason)
+ *out_disable_reason = "There are no parts inside partition";
return SelectPartsDecision::CANNOT_SELECT;
+ }
if (!final && parts.size() == 1)
{
@@ -342,6 +346,8 @@ SelectPartsDecision MergeTreeDataMergerMutator::selectAllPartsToMergeWithinParti
if (final && optimize_skip_merged_partitions && parts.size() == 1 && parts[0]->info.level > 0 &&
(!metadata_snapshot->hasAnyTTL() || parts[0]->checkAllTTLCalculated(metadata_snapshot)))
{
+ if (out_disable_reason)
+ *out_disable_reason = "Partition skipped due to optimize_skip_merged_partitions";
return SelectPartsDecision::NOTHING_TO_MERGE;
}
diff --git a/src/Storages/StorageReplicatedMergeTree.cpp b/src/Storages/StorageReplicatedMergeTree.cpp
index e5d59f2a950..06bf06b0ef3 100644
--- a/src/Storages/StorageReplicatedMergeTree.cpp
+++ b/src/Storages/StorageReplicatedMergeTree.cpp
@@ -4203,143 +4203,123 @@ bool StorageReplicatedMergeTree::optimize(
if (!is_leader)
throw Exception("OPTIMIZE cannot be done on this replica because it is not a leader", ErrorCodes::NOT_A_LEADER);
- constexpr size_t max_retries = 10;
-
- std::vector merge_entries;
+ auto handle_noop = [&] (const String & message)
{
- auto zookeeper = getZooKeeper();
+ if (query_context->getSettingsRef().optimize_throw_if_noop)
+ throw Exception(message, ErrorCodes::CANNOT_ASSIGN_OPTIMIZE);
+ return false;
+ };
- auto handle_noop = [&] (const String & message)
+ auto zookeeper = getZooKeeper();
+ UInt64 disk_space = getStoragePolicy()->getMaxUnreservedFreeSpace();
+ const auto storage_settings_ptr = getSettings();
+ auto metadata_snapshot = getInMemoryMetadataPtr();
+ std::vector merge_entries;
+
+ auto try_assign_merge = [&](const String & partition_id) -> bool
+ {
+ constexpr size_t max_retries = 10;
+ size_t try_no = 0;
+ for (; try_no < max_retries; ++try_no)
{
- if (query_context->getSettingsRef().optimize_throw_if_noop)
- throw Exception(message, ErrorCodes::CANNOT_ASSIGN_OPTIMIZE);
- return false;
- };
+ /// We must select parts for merge under merge_selecting_mutex because other threads
+ /// (merge_selecting_thread or OPTIMIZE queries) could assign new merges.
+ std::lock_guard merge_selecting_lock(merge_selecting_mutex);
+ ReplicatedMergeTreeMergePredicate can_merge = queue.getMergePredicate(zookeeper);
- const auto storage_settings_ptr = getSettings();
- auto metadata_snapshot = getInMemoryMetadataPtr();
+ auto future_merged_part = std::make_shared();
+ if (storage_settings.get()->assign_part_uuids)
+ future_merged_part->uuid = UUIDHelpers::generateV4();
- if (!partition && final)
- {
- DataPartsVector data_parts = getDataPartsVector();
- std::unordered_set partition_ids;
+ constexpr const char * unknown_disable_reason = "unknown reason";
+ String disable_reason = unknown_disable_reason;
+ SelectPartsDecision select_decision = SelectPartsDecision::CANNOT_SELECT;
- for (const DataPartPtr & part : data_parts)
- partition_ids.emplace(part->info.partition_id);
-
- UInt64 disk_space = getStoragePolicy()->getMaxUnreservedFreeSpace();
-
- for (const String & partition_id : partition_ids)
+ if (partition_id.empty())
{
- size_t try_no = 0;
- for (; try_no < max_retries; ++try_no)
- {
- /// We must select parts for merge under merge_selecting_mutex because other threads
- /// (merge_selecting_thread or OPTIMIZE queries) could assign new merges.
- std::lock_guard merge_selecting_lock(merge_selecting_mutex);
- ReplicatedMergeTreeMergePredicate can_merge = queue.getMergePredicate(zookeeper);
-
- auto future_merged_part = std::make_shared();
-
- if (storage_settings.get()->assign_part_uuids)
- future_merged_part->uuid = UUIDHelpers::generateV4();
-
- SelectPartsDecision select_decision = merger_mutator.selectAllPartsToMergeWithinPartition(
- future_merged_part, disk_space, can_merge, partition_id, true, metadata_snapshot, nullptr, query_context->getSettingsRef().optimize_skip_merged_partitions);
-
- if (select_decision != SelectPartsDecision::SELECTED)
- break;
-
- ReplicatedMergeTreeLogEntryData merge_entry;
- CreateMergeEntryResult create_result = createLogEntryToMergeParts(
- zookeeper, future_merged_part->parts,
- future_merged_part->name, future_merged_part->uuid, future_merged_part->type,
- deduplicate, deduplicate_by_columns,
- &merge_entry, can_merge.getVersion(), future_merged_part->merge_type);
-
- if (create_result == CreateMergeEntryResult::MissingPart)
- return handle_noop("Can't create merge queue node in ZooKeeper, because some parts are missing");
-
- if (create_result == CreateMergeEntryResult::LogUpdated)
- continue;
-
- merge_entries.push_back(std::move(merge_entry));
- break;
- }
- if (try_no == max_retries)
- return handle_noop("Can't create merge queue node in ZooKeeper, because log was updated in every of "
- + toString(max_retries) + " tries");
+ select_decision = merger_mutator.selectPartsToMerge(
+ future_merged_part, /* aggressive */ true, storage_settings_ptr->max_bytes_to_merge_at_max_space_in_pool,
+ can_merge, /* merge_with_ttl_allowed */ false, &disable_reason);
}
- }
- else
- {
- size_t try_no = 0;
- for (; try_no < max_retries; ++try_no)
+ else
{
- std::lock_guard merge_selecting_lock(merge_selecting_mutex);
- ReplicatedMergeTreeMergePredicate can_merge = queue.getMergePredicate(zookeeper);
+ select_decision = merger_mutator.selectAllPartsToMergeWithinPartition(
+ future_merged_part, disk_space, can_merge, partition_id, final, metadata_snapshot,
+ &disable_reason, query_context->getSettingsRef().optimize_skip_merged_partitions);
+ }
- auto future_merged_part = std::make_shared();
- if (storage_settings.get()->assign_part_uuids)
- future_merged_part->uuid = UUIDHelpers::generateV4();
+ /// If there is nothing to merge then we treat this merge as successful (needed for optimize final optimization)
+ if (select_decision == SelectPartsDecision::NOTHING_TO_MERGE)
+ return false;
- String disable_reason;
- SelectPartsDecision select_decision = SelectPartsDecision::CANNOT_SELECT;
+ if (select_decision != SelectPartsDecision::SELECTED)
+ {
+ constexpr const char * message_fmt = "Cannot select parts for optimization: {}";
+ assert(disable_reason != unknown_disable_reason);
+ if (!partition_id.empty())
+ disable_reason += fmt::format(" (in partition {})", partition_id);
+ String message = fmt::format(message_fmt, disable_reason);
+ LOG_INFO(log, message);
+ return handle_noop(message);
+ }
- if (!partition)
- {
- select_decision = merger_mutator.selectPartsToMerge(
- future_merged_part, true, storage_settings_ptr->max_bytes_to_merge_at_max_space_in_pool, can_merge, false, &disable_reason);
- }
- else
- {
- UInt64 disk_space = getStoragePolicy()->getMaxUnreservedFreeSpace();
- String partition_id = getPartitionIDFromQuery(partition, query_context);
- select_decision = merger_mutator.selectAllPartsToMergeWithinPartition(
- future_merged_part, disk_space, can_merge, partition_id, final, metadata_snapshot, &disable_reason, query_context->getSettingsRef().optimize_skip_merged_partitions);
- }
+ ReplicatedMergeTreeLogEntryData merge_entry;
+ CreateMergeEntryResult create_result = createLogEntryToMergeParts(
+ zookeeper, future_merged_part->parts,
+ future_merged_part->name, future_merged_part->uuid, future_merged_part->type,
+ deduplicate, deduplicate_by_columns,
+ &merge_entry, can_merge.getVersion(), future_merged_part->merge_type);
- /// If there is nothing to merge then we treat this merge as successful (needed for optimize final optimization)
- if (select_decision == SelectPartsDecision::NOTHING_TO_MERGE)
- break;
+ if (create_result == CreateMergeEntryResult::MissingPart)
+ {
+ String message = "Can't create merge queue node in ZooKeeper, because some parts are missing";
+ LOG_TRACE(log, message);
+ return handle_noop(message);
+ }
- if (select_decision != SelectPartsDecision::SELECTED)
- {
- constexpr const char * message_fmt = "Cannot select parts for optimization: {}";
- if (disable_reason.empty())
- disable_reason = "unknown reason";
- LOG_INFO(log, message_fmt, disable_reason);
- return handle_noop(fmt::format(message_fmt, disable_reason));
- }
+ if (create_result == CreateMergeEntryResult::LogUpdated)
+ continue;
- ReplicatedMergeTreeLogEntryData merge_entry;
- CreateMergeEntryResult create_result = createLogEntryToMergeParts(
- zookeeper, future_merged_part->parts,
- future_merged_part->name, future_merged_part->uuid, future_merged_part->type,
- deduplicate, deduplicate_by_columns,
- &merge_entry, can_merge.getVersion(), future_merged_part->merge_type);
+ merge_entries.push_back(std::move(merge_entry));
+ return true;
+ }
- if (create_result == CreateMergeEntryResult::MissingPart)
- return handle_noop("Can't create merge queue node in ZooKeeper, because some parts are missing");
+ assert(try_no == max_retries);
+ String message = fmt::format("Can't create merge queue node in ZooKeeper, because log was updated in every of {} tries", try_no);
+ LOG_TRACE(log, message);
+ return handle_noop(message);
+ };
- if (create_result == CreateMergeEntryResult::LogUpdated)
- continue;
+ bool assigned = false;
+ if (!partition && final)
+ {
+ DataPartsVector data_parts = getDataPartsVector();
+ std::unordered_set partition_ids;
- merge_entries.push_back(std::move(merge_entry));
+ for (const DataPartPtr & part : data_parts)
+ partition_ids.emplace(part->info.partition_id);
+
+ for (const String & partition_id : partition_ids)
+ {
+ assigned = try_assign_merge(partition_id);
+ if (!assigned)
break;
- }
- if (try_no == max_retries)
- return handle_noop("Can't create merge queue node in ZooKeeper, because log was updated in every of "
- + toString(max_retries) + " tries");
}
}
+ else
+ {
+ String partition_id;
+ if (partition)
+ partition_id = getPartitionIDFromQuery(partition, query_context);
+ assigned = try_assign_merge(partition_id);
+ }
table_lock.reset();
for (auto & merge_entry : merge_entries)
waitForLogEntryToBeProcessedIfNecessary(merge_entry, query_context);
- return true;
+ return assigned;
}
bool StorageReplicatedMergeTree::executeMetadataAlter(const StorageReplicatedMergeTree::LogEntry & entry)
From 0db1e3614c82777de8f4f389b2cb9c06146b7534 Mon Sep 17 00:00:00 2001
From: Alexander Tokmakov
Date: Thu, 7 Oct 2021 13:21:42 +0300
Subject: [PATCH 049/104] fix test
---
tests/integration/test_dictionaries_dependency/test.py | 7 +++++--
1 file changed, 5 insertions(+), 2 deletions(-)
diff --git a/tests/integration/test_dictionaries_dependency/test.py b/tests/integration/test_dictionaries_dependency/test.py
index ceab39aacb8..9b1019822e3 100644
--- a/tests/integration/test_dictionaries_dependency/test.py
+++ b/tests/integration/test_dictionaries_dependency/test.py
@@ -106,8 +106,11 @@ def test_dependency_via_dictionary_database(node):
for d_name in d_names:
assert node.query("SELECT dictGet({}, 'y', toUInt64(5))".format(d_name)) == "6\n"
- check()
+
+ for d_name in d_names:
+ assert node.query("SELECT dictGet({}, 'y', toUInt64(5))".format(d_name)) == "6\n"
# Restart must not break anything.
node.restart_clickhouse()
- check()
+ for d_name in d_names:
+ assert node.query_with_retry("SELECT dictGet({}, 'y', toUInt64(5))".format(d_name)) == "6\n"
From 7e2bc184ec29358cce749059bf776eccc784231e Mon Sep 17 00:00:00 2001
From: Alexander Tokmakov
Date: Thu, 7 Oct 2021 16:43:49 +0300
Subject: [PATCH 050/104] fix other suspicious places, add test
---
src/Interpreters/MySQL/InterpretersMySQLDDLQuery.cpp | 2 +-
src/Parsers/ParserCreateQuery.cpp | 2 +-
src/Storages/MergeTree/MergeTreeIndexSet.cpp | 2 +-
tests/queries/0_stateless/01188_attach_table_from_path.sql | 1 +
4 files changed, 4 insertions(+), 3 deletions(-)
diff --git a/src/Interpreters/MySQL/InterpretersMySQLDDLQuery.cpp b/src/Interpreters/MySQL/InterpretersMySQLDDLQuery.cpp
index f2860235117..a96713e3b5d 100644
--- a/src/Interpreters/MySQL/InterpretersMySQLDDLQuery.cpp
+++ b/src/Interpreters/MySQL/InterpretersMySQLDDLQuery.cpp
@@ -120,7 +120,7 @@ static NamesAndTypesList getColumnsList(const ASTExpressionList * columns_defini
auto * literal = child->as();
new_child->arguments = std::make_shared();
- new_child->arguments->children.push_back(std::make_shared(literal->value.get()));
+ new_child->arguments->children.push_back(std::make_shared(literal->value.safeGet()));
new_child->arguments->children.push_back(std::make_shared(Int16(++i)));
child = new_child;
}
diff --git a/src/Parsers/ParserCreateQuery.cpp b/src/Parsers/ParserCreateQuery.cpp
index 2ea1663fc80..1da1bfba491 100644
--- a/src/Parsers/ParserCreateQuery.cpp
+++ b/src/Parsers/ParserCreateQuery.cpp
@@ -896,7 +896,7 @@ bool ParserCreateViewQuery::parseImpl(Pos & pos, ASTPtr & node, Expected & expec
if (ParserKeyword{"TO INNER UUID"}.ignore(pos, expected))
{
- ParserLiteral literal_p;
+ ParserStringLiteral literal_p;
if (!literal_p.parse(pos, to_inner_uuid, expected))
return false;
}
diff --git a/src/Storages/MergeTree/MergeTreeIndexSet.cpp b/src/Storages/MergeTree/MergeTreeIndexSet.cpp
index 024b87c9a3e..60b9ddae329 100644
--- a/src/Storages/MergeTree/MergeTreeIndexSet.cpp
+++ b/src/Storages/MergeTree/MergeTreeIndexSet.cpp
@@ -461,7 +461,7 @@ bool MergeTreeIndexConditionSet::checkASTUseless(const ASTPtr & node, bool atomi
[this](const auto & arg) { return checkASTUseless(arg, true); });
}
else if (const auto * literal = node->as())
- return !atomic && literal->value.get();
+ return !atomic && literal->value.safeGet();
else if (const auto * identifier = node->as())
return key_columns.find(identifier->getColumnName()) == std::end(key_columns);
else
diff --git a/tests/queries/0_stateless/01188_attach_table_from_path.sql b/tests/queries/0_stateless/01188_attach_table_from_path.sql
index 5b99c07e986..9bf401c8ea4 100644
--- a/tests/queries/0_stateless/01188_attach_table_from_path.sql
+++ b/tests/queries/0_stateless/01188_attach_table_from_path.sql
@@ -7,6 +7,7 @@ drop table if exists mt;
attach table test from 'some/path' (n UInt8) engine=Memory; -- { serverError 48 }
attach table test from '/etc/passwd' (s String) engine=File(TSVRaw); -- { serverError 481 }
attach table test from '../../../../../../../../../etc/passwd' (s String) engine=File(TSVRaw); -- { serverError 481 }
+attach table test from 42 (s String) engine=File(TSVRaw); -- { clientError 62 }
insert into table function file('01188_attach/file/data.TSV', 'TSV', 's String, n UInt8') values ('file', 42);
attach table file from '01188_attach/file' (s String, n UInt8) engine=File(TSV);
From d24bfce93fda2d35360213adc3f90936d8cab010 Mon Sep 17 00:00:00 2001
From: Nikolai Kochetov
Date: Thu, 7 Oct 2021 17:03:54 +0300
Subject: [PATCH 051/104] Add coroutines example.
---
src/Core/examples/CMakeLists.txt | 3 +
src/Core/examples/coro.cpp | 202 +++++++++++++++++++++++++++++++
2 files changed, 205 insertions(+)
create mode 100644 src/Core/examples/coro.cpp
diff --git a/src/Core/examples/CMakeLists.txt b/src/Core/examples/CMakeLists.txt
index 6b07dfbbfa6..c8846eb1743 100644
--- a/src/Core/examples/CMakeLists.txt
+++ b/src/Core/examples/CMakeLists.txt
@@ -13,3 +13,6 @@ target_link_libraries (mysql_protocol PRIVATE dbms)
if(USE_SSL)
target_include_directories (mysql_protocol SYSTEM PRIVATE ${OPENSSL_INCLUDE_DIR})
endif()
+
+add_executable (coro coro.cpp)
+target_link_libraries (coro PRIVATE clickhouse_common_io)
diff --git a/src/Core/examples/coro.cpp b/src/Core/examples/coro.cpp
new file mode 100644
index 00000000000..c8e2f7418e4
--- /dev/null
+++ b/src/Core/examples/coro.cpp
@@ -0,0 +1,202 @@
+#include
+
+#include
+#include
+#include
+#include
+
+#include
+#include
+#include
+#include
+#include
+
+#if defined(__clang__)
+
+#include
+
+template
+using coroutine_handle = std::experimental::coroutine_handle;
+
+using default_coroutine_handle = std::experimental::coroutine_handle<>;
+
+using suspend_never = std::experimental::suspend_never;
+using suspend_always = std::experimental::suspend_always;
+
+#else
+
+#include
+
+template
+using coroutine_handle = std::coroutine_handle;
+
+using default_coroutine_handle = std::coroutine_handle<>;
+
+using suspend_never = std::suspend_never;
+using suspend_always = std::suspend_always;
+
+#endif
+
+
+template
+struct suspend_never_val
+{
+ constexpr bool await_ready() const noexcept { return true; }
+ constexpr void await_suspend(default_coroutine_handle) const noexcept {}
+ constexpr T await_resume() const noexcept
+ {
+ std::cout << " ret " << val << std::endl;
+ return val;
+ }
+
+ T val;
+};
+
+template
+struct resumable
+{
+ struct promise_type
+ {
+ using coro_handle = coroutine_handle;
+ auto get_return_object() { return coro_handle::from_promise(*this); }
+ auto initial_suspend() { return suspend_never(); }
+ auto final_suspend() noexcept { return suspend_never_val{*r->value}; }
+ //void return_void() {}
+ void return_value(T value_) { r->value = value_; }
+ void unhandled_exception()
+ {
+ DB::tryLogCurrentException("Logger");
+ r->exception = std::current_exception();
+ }
+
+ explicit promise_type(std::string tag_) : tag(tag_) {}
+ ~promise_type() { std::cout << "~promise_type " << tag << std::endl; }
+ std::string tag;
+ coro_handle next;
+ resumable * r = nullptr;
+ };
+
+ using coro_handle = coroutine_handle;
+
+ bool await_ready() const noexcept { return false; }
+ void await_suspend(coro_handle g) noexcept
+ {
+ std::cout << " await_suspend " << my.promise().tag << std::endl;
+ std::cout << " g tag " << g.promise().tag << std::endl;
+ g.promise().next = my;
+ }
+ T await_resume() noexcept
+ {
+ std::cout << " await_res " << my.promise().tag << std::endl;
+ return *value;
+ }
+
+ resumable(coro_handle handle) : my(handle), tag(handle.promise().tag)
+ {
+ assert(handle);
+ my.promise().r = this;
+ std::cout << " resumable " << tag << std::endl;
+ }
+ resumable(resumable &) = delete;
+ resumable(resumable &&rhs) : my(rhs.my), tag(rhs.tag)
+ {
+ rhs.my = {};
+ std::cout << " resumable&& " << tag << std::endl;
+ }
+ static bool resume_impl(resumable *r)
+ {
+ if (r->value)
+ return false;
+
+ auto & next = r->my.promise().next;
+
+ if (next)
+ {
+ if (resume_impl(next.promise().r))
+ return true;
+ next = {};
+ }
+
+ if (!r->value)
+ {
+ r->my.resume();
+ if (r->exception)
+ std::rethrow_exception(r->exception);
+ }
+ return !r->value;
+ }
+
+ bool resume()
+ {
+ return resume_impl(this);
+ }
+
+ T res()
+ {
+ return *value;
+ }
+
+ ~resumable()
+ {
+ std::cout << " ~resumable " << tag << std::endl;
+ }
+
+private:
+ coro_handle my;
+ std::string tag;
+ std::optional value;
+ std::exception_ptr exception;
+};
+
+resumable boo(std::string tag)
+{
+ std::cout << "x" << std::endl;
+ co_await suspend_always();
+ std::cout << StackTrace().toString();
+ std::cout << "y" << std::endl;
+ co_return 1;
+}
+
+resumable bar(std::string tag)
+{
+ std::cout << "a" << std::endl;
+ int res1 = co_await boo("boo1");
+ std::cout << "b " << res1 << std::endl;
+ int res2 = co_await boo("boo2");
+ if (res2 == 1)
+ throw DB::Exception(1, "hello");
+ std::cout << "c " << res2 << std::endl;
+ co_return res1 + res2; // 1 + 1 = 2
+}
+
+resumable foo(std::string tag) {
+ std::cout << "Hello" << std::endl;
+ auto res1 = co_await bar("bar1");
+ std::cout << "Coro " << res1 << std::endl;
+ auto res2 = co_await bar("bar2");
+ std::cout << "World " << res2 << std::endl;
+ co_return res1 * res2; // 2 * 2 = 4
+}
+
+int main()
+{
+ Poco::AutoPtr app_channel(new Poco::ConsoleChannel(std::cerr));
+ Poco::Logger::root().setChannel(app_channel);
+ Poco::Logger::root().setLevel("trace");
+
+ LOG_INFO(&Poco::Logger::get(""), "Starting");
+
+ try
+ {
+ auto t = foo("foo");
+ std::cout << ".. started" << std::endl;
+ while (t.resume())
+ std::cout << ".. yielded" << std::endl;
+ std::cout << ".. done: " << t.res() << std::endl;
+ }
+ catch (DB::Exception & e)
+ {
+ std::cout << "Got exception " << e.what() << std::endl;
+ std::cout << e.getStackTraceString() << std::endl;
+ }
+}
From 213d68d9958855c07f5551e617eaa091af6fa36e Mon Sep 17 00:00:00 2001
From: Nikolai Kochetov
Date: Thu, 7 Oct 2021 20:27:13 +0300
Subject: [PATCH 052/104] Fix some tests.
---
.../DistinctSortedBlockInputStream.cpp | 3 +++
src/DataStreams/TTLBlockInputStream.cpp | 24 ++++++++++++-----
src/DataStreams/TTLBlockInputStream.h | 7 ++---
src/DataStreams/TTLCalcInputStream.cpp | 26 +++++++++++++++----
src/DataStreams/TTLCalcInputStream.h | 7 ++---
5 files changed, 50 insertions(+), 17 deletions(-)
diff --git a/src/DataStreams/DistinctSortedBlockInputStream.cpp b/src/DataStreams/DistinctSortedBlockInputStream.cpp
index a3105d6330c..47421941b45 100644
--- a/src/DataStreams/DistinctSortedBlockInputStream.cpp
+++ b/src/DataStreams/DistinctSortedBlockInputStream.cpp
@@ -47,7 +47,10 @@ void DistinctSortedTransform::transform(Chunk & chunk)
/// Just go to the next block if there isn't any new record in the current one.
if (!has_new_data)
+ {
+ chunk.clear();
return;
+ }
if (!set_size_limits.check(data.getTotalRowCount(), data.getTotalByteCount(), "DISTINCT", ErrorCodes::SET_SIZE_LIMIT_EXCEEDED))
{
diff --git a/src/DataStreams/TTLBlockInputStream.cpp b/src/DataStreams/TTLBlockInputStream.cpp
index 1a1484fc08e..b476f689e60 100644
--- a/src/DataStreams/TTLBlockInputStream.cpp
+++ b/src/DataStreams/TTLBlockInputStream.cpp
@@ -23,7 +23,7 @@ TTLTransform::TTLTransform(
const MergeTreeData::MutableDataPartPtr & data_part_,
time_t current_time_,
bool force_)
- : ISimpleTransform(header_, header_, false)
+ : IAccumulatingTransform(header_, header_)
, data_part(data_part_)
, log(&Poco::Logger::get(storage_.getLogName() + " (TTLTransform)"))
{
@@ -97,16 +97,16 @@ Block reorderColumns(Block block, const Block & header)
return res;
}
-void TTLTransform::transform(Chunk & chunk)
+void TTLTransform::consume(Chunk chunk)
{
if (all_data_dropped)
{
- stopReading();
- chunk.clear();
+ finishConsume();
return;
}
auto block = getInputPort().getHeader().cloneWithColumns(chunk.detachColumns());
+
for (const auto & algorithm : algorithms)
algorithm->execute(block);
@@ -114,8 +114,20 @@ void TTLTransform::transform(Chunk & chunk)
return;
size_t num_rows = block.rows();
+ setReadyChunk(Chunk(reorderColumns(std::move(block), getOutputPort().getHeader()).getColumns(), num_rows));
+}
- chunk = Chunk(reorderColumns(std::move(block), getOutputPort().getHeader()).getColumns(), num_rows);
+Chunk TTLTransform::generate()
+{
+ Block block;
+ for (const auto & algorithm : algorithms)
+ algorithm->execute(block);
+
+ if (!block)
+ return {};
+
+ size_t num_rows = block.rows();
+ return Chunk(reorderColumns(std::move(block), getOutputPort().getHeader()).getColumns(), num_rows);
}
void TTLTransform::finalize()
@@ -133,7 +145,7 @@ void TTLTransform::finalize()
IProcessor::Status TTLTransform::prepare()
{
- auto status = ISimpleTransform::prepare();
+ auto status = IAccumulatingTransform::prepare();
if (status == Status::Finished)
finalize();
diff --git a/src/DataStreams/TTLBlockInputStream.h b/src/DataStreams/TTLBlockInputStream.h
index 986181df652..50b28e81bdf 100644
--- a/src/DataStreams/TTLBlockInputStream.h
+++ b/src/DataStreams/TTLBlockInputStream.h
@@ -1,5 +1,5 @@
#pragma once
-#include
+#include
#include
#include
#include
@@ -12,7 +12,7 @@
namespace DB
{
-class TTLTransform : public ISimpleTransform
+class TTLTransform : public IAccumulatingTransform
{
public:
TTLTransform(
@@ -29,7 +29,8 @@ public:
Status prepare() override;
protected:
- void transform(Chunk & chunk) override;
+ void consume(Chunk chunk) override;
+ Chunk generate() override;
/// Finalizes ttl infos and updates data part
void finalize();
diff --git a/src/DataStreams/TTLCalcInputStream.cpp b/src/DataStreams/TTLCalcInputStream.cpp
index c156b31428a..fe85e40c003 100644
--- a/src/DataStreams/TTLCalcInputStream.cpp
+++ b/src/DataStreams/TTLCalcInputStream.cpp
@@ -11,9 +11,9 @@ TTLCalcTransform::TTLCalcTransform(
const MergeTreeData::MutableDataPartPtr & data_part_,
time_t current_time_,
bool force_)
- : ISimpleTransform(header_, header_, true)
+ : IAccumulatingTransform(header_, header_)
, data_part(data_part_)
- , log(&Poco::Logger::get(storage_.getLogName() + " (TTLCalcInputStream)"))
+ , log(&Poco::Logger::get(storage_.getLogName() + " (TTLCalcTransform)"))
{
auto old_ttl_infos = data_part->ttl_infos;
@@ -50,7 +50,7 @@ TTLCalcTransform::TTLCalcTransform(
recompression_ttl, TTLUpdateField::RECOMPRESSION_TTL, recompression_ttl.result_column, old_ttl_infos.recompression_ttl[recompression_ttl.result_column], current_time_, force_));
}
-void TTLCalcTransform::transform(Chunk & chunk)
+void TTLCalcTransform::consume(Chunk chunk)
{
auto block = getInputPort().getHeader().cloneWithColumns(chunk.detachColumns());
for (const auto & algorithm : algorithms)
@@ -63,7 +63,23 @@ void TTLCalcTransform::transform(Chunk & chunk)
for (const auto & col : getOutputPort().getHeader())
res.addColumn(block.getByName(col.name).column);
- chunk = std::move(res);
+ setReadyChunk(std::move(res));
+}
+
+Chunk TTLCalcTransform::generate()
+{
+ Block block;
+ for (const auto & algorithm : algorithms)
+ algorithm->execute(block);
+
+ if (!block)
+ return {};
+
+ Chunk res;
+ for (const auto & col : getOutputPort().getHeader())
+ res.addColumn(block.getByName(col.name).column);
+
+ return res;
}
void TTLCalcTransform::finalize()
@@ -75,7 +91,7 @@ void TTLCalcTransform::finalize()
IProcessor::Status TTLCalcTransform::prepare()
{
- auto status = ISimpleTransform::prepare();
+ auto status = IAccumulatingTransform::prepare();
if (status == Status::Finished)
finalize();
diff --git a/src/DataStreams/TTLCalcInputStream.h b/src/DataStreams/TTLCalcInputStream.h
index d0e7b0055f2..b6318026b8c 100644
--- a/src/DataStreams/TTLCalcInputStream.h
+++ b/src/DataStreams/TTLCalcInputStream.h
@@ -1,5 +1,5 @@
#pragma once
-#include
+#include
#include
#include
#include
@@ -11,7 +11,7 @@
namespace DB
{
-class TTLCalcTransform : public ISimpleTransform
+class TTLCalcTransform : public IAccumulatingTransform
{
public:
TTLCalcTransform(
@@ -27,7 +27,8 @@ public:
Status prepare() override;
protected:
- void transform(Chunk & chunk) override;
+ void consume(Chunk chunk) override;
+ Chunk generate() override;
/// Finalizes ttl infos and updates data part
void finalize();
From ee347fc4160c36c0505fbf79bdab8e1f19dce4f4 Mon Sep 17 00:00:00 2001
From: Azat Khuzhin
Date: Thu, 7 Oct 2021 21:02:38 +0300
Subject: [PATCH 053/104] Update changelog to include caveats about Nullable
types in data skipping indexes
---
CHANGELOG.md | 3 +--
1 file changed, 1 insertion(+), 2 deletions(-)
diff --git a/CHANGELOG.md b/CHANGELOG.md
index babb5ebca8d..d203fcba4c8 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -110,6 +110,7 @@
* Fix the issue that in case of some sophisticated query with column aliases identical to the names of expressions, bad cast may happen. This fixes [#25447](https://github.com/ClickHouse/ClickHouse/issues/25447). This fixes [#26914](https://github.com/ClickHouse/ClickHouse/issues/26914). This fix may introduce backward incompatibility: if there are different expressions with identical names, exception will be thrown. It may break some rare cases when `enable_optimize_predicate_expression` is set. [#26639](https://github.com/ClickHouse/ClickHouse/pull/26639) ([alexey-milovidov](https://github.com/alexey-milovidov)).
* Now, scalar subquery always returns `Nullable` result if it's type can be `Nullable`. It is needed because in case of empty subquery it's result should be `Null`. Previously, it was possible to get error about incompatible types (type deduction does not execute scalar subquery, and it could use not-nullable type). Scalar subquery with empty result which can't be converted to `Nullable` (like `Array` or `Tuple`) now throws error. Fixes [#25411](https://github.com/ClickHouse/ClickHouse/issues/25411). [#26423](https://github.com/ClickHouse/ClickHouse/pull/26423) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
* Introduce syntax for here documents. Example `SELECT $doc$ VALUE $doc$`. [#26671](https://github.com/ClickHouse/ClickHouse/pull/26671) ([Maksim Kita](https://github.com/kitaisreal)). This change is backward incompatible if in query there are identifiers that contain `$` [#28768](https://github.com/ClickHouse/ClickHouse/issues/28768).
+* Now indices can handle Nullable types, including `isNull` and `isNotNull`. [#12433](https://github.com/ClickHouse/ClickHouse/pull/12433) and [#12455](https://github.com/ClickHouse/ClickHouse/pull/12455) ([Amos Bird](https://github.com/amosbird)) and [#27250](https://github.com/ClickHouse/ClickHouse/pull/27250) ([Azat Khuzhin](https://github.com/azat)). But this was done with on-disk format changes, and even though new server can read old data, old server cannot. Also, in case you have `MINMAX` data skipping indices, you may get `Data after mutation/merge is not byte-identical` error, since new index will have `.idx2` extension while before it was `.idx`. This means you should not delay updating all existing replicas in this case; otherwise, if an old replica (<21.9) downloads data from a new replica (21.9+), it will not be able to apply the index for the downloaded part.
#### New Feature
@@ -179,7 +180,6 @@
* Add setting `log_formatted_queries` to log additional formatted query into `system.query_log`. It's useful for normalized query analysis because functions like `normalizeQuery` and `normalizeQueryKeepNames` don't parse/format queries in order to achieve better performance. [#27380](https://github.com/ClickHouse/ClickHouse/pull/27380) ([Amos Bird](https://github.com/amosbird)).
* Add two settings `max_hyperscan_regexp_length` and `max_hyperscan_regexp_total_length` to prevent huge regexp being used in hyperscan related functions, such as `multiMatchAny`. [#27378](https://github.com/ClickHouse/ClickHouse/pull/27378) ([Amos Bird](https://github.com/amosbird)).
* Memory consumed by bitmap aggregate functions now is taken into account for memory limits. This closes [#26555](https://github.com/ClickHouse/ClickHouse/issues/26555). [#27252](https://github.com/ClickHouse/ClickHouse/pull/27252) ([alexey-milovidov](https://github.com/alexey-milovidov)).
-* Add new index data skipping minmax index format for proper Nullable support. [#27250](https://github.com/ClickHouse/ClickHouse/pull/27250) ([Azat Khuzhin](https://github.com/azat)).
* Add 10 seconds cache for S3 proxy resolver. [#27216](https://github.com/ClickHouse/ClickHouse/pull/27216) ([ianton-ru](https://github.com/ianton-ru)).
* Split global mutex into individual regexp construction. This helps avoid huge regexp construction blocking other related threads. [#27211](https://github.com/ClickHouse/ClickHouse/pull/27211) ([Amos Bird](https://github.com/amosbird)).
* Support schema for PostgreSQL database engine. Closes [#27166](https://github.com/ClickHouse/ClickHouse/issues/27166). [#27198](https://github.com/ClickHouse/ClickHouse/pull/27198) ([Kseniia Sumarokova](https://github.com/kssenii)).
@@ -234,7 +234,6 @@
* Fix multiple block insertion into distributed table with `insert_distributed_one_random_shard = 1`. This is a marginal feature. Mark as improvement. [#23140](https://github.com/ClickHouse/ClickHouse/pull/23140) ([Amos Bird](https://github.com/amosbird)).
* Support `LowCardinality` and `FixedString` keys/values for `Map` type. [#21543](https://github.com/ClickHouse/ClickHouse/pull/21543) ([hexiaoting](https://github.com/hexiaoting)).
* Enable reloading of local disk config. [#19526](https://github.com/ClickHouse/ClickHouse/pull/19526) ([taiyang-li](https://github.com/taiyang-li)).
-* Now KeyConditions can correctly skip nullable keys, including `isNull` and `isNotNull`. https://github.com/ClickHouse/ClickHouse/pull/12433. [#12455](https://github.com/ClickHouse/ClickHouse/pull/12455) ([Amos Bird](https://github.com/amosbird)).
#### Bug Fix
From 1b8e3b6b962df0c0bf26fbdf86cefbc2e12ebaa0 Mon Sep 17 00:00:00 2001
From: Azat Khuzhin
Date: Thu, 7 Oct 2021 21:10:44 +0300
Subject: [PATCH 054/104] Fix system tables recreation check (fails to detect
changes in enum values)
Fixes: #23934 (cc @kitaisreal)
---
src/Interpreters/SystemLog.h | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/src/Interpreters/SystemLog.h b/src/Interpreters/SystemLog.h
index 615180d27dd..ce0062e8c77 100644
--- a/src/Interpreters/SystemLog.h
+++ b/src/Interpreters/SystemLog.h
@@ -527,7 +527,7 @@ void SystemLog::prepareTable()
auto alias_columns = LogElement::getNamesAndAliases();
auto current_query = InterpreterCreateQuery::formatColumns(ordinary_columns, alias_columns);
- if (old_query->getTreeHash() != current_query->getTreeHash())
+ if (serializeAST(*old_query) != serializeAST(*current_query))
{
/// Rename the existing table.
int suffix = 0;
From bf88f102fe7e0cd94b80ab29dbf2ebaebd9645bb Mon Sep 17 00:00:00 2001
From: Azat Khuzhin
Date: Thu, 7 Oct 2021 21:13:56 +0300
Subject: [PATCH 055/104] Add ability to trace peak memory usage (with new
trace_type - MemoryPeak)
---
src/Common/MemoryTracker.cpp | 19 ++++++++++++++++---
src/Common/MemoryTracker.h | 2 +-
src/Common/TraceCollector.h | 3 ++-
src/Interpreters/TraceLog.cpp | 1 +
.../01092_memory_profiler.reference | 1 +
.../0_stateless/01092_memory_profiler.sql | 1 +
6 files changed, 22 insertions(+), 5 deletions(-)
diff --git a/src/Common/MemoryTracker.cpp b/src/Common/MemoryTracker.cpp
index 205771a5f6c..013005442be 100644
--- a/src/Common/MemoryTracker.cpp
+++ b/src/Common/MemoryTracker.cpp
@@ -200,11 +200,13 @@ void MemoryTracker::allocImpl(Int64 size, bool throw_if_memory_exceeded)
}
+ bool allocation_traced = false;
if (unlikely(current_profiler_limit && will_be > current_profiler_limit))
{
BlockerInThread untrack_lock(VariableContext::Global);
DB::TraceCollector::collect(DB::TraceType::Memory, StackTrace(), size);
setOrRaiseProfilerLimit((will_be + profiler_step - 1) / profiler_step * profiler_step);
+ allocation_traced = true;
}
std::bernoulli_distribution sample(sample_probability);
@@ -212,6 +214,7 @@ void MemoryTracker::allocImpl(Int64 size, bool throw_if_memory_exceeded)
{
BlockerInThread untrack_lock(VariableContext::Global);
DB::TraceCollector::collect(DB::TraceType::MemorySample, StackTrace(), size);
+ allocation_traced = true;
}
if (unlikely(current_hard_limit && will_be > current_hard_limit) && memoryTrackerCanThrow(level, false) && throw_if_memory_exceeded)
@@ -230,17 +233,24 @@ void MemoryTracker::allocImpl(Int64 size, bool throw_if_memory_exceeded)
formatReadableSizeWithBinarySuffix(current_hard_limit));
}
+ bool peak_updated;
if (throw_if_memory_exceeded)
{
/// Prevent recursion. Exception::ctor -> std::string -> new[] -> MemoryTracker::alloc
BlockerInThread untrack_lock(VariableContext::Global);
bool log_memory_usage = true;
- updatePeak(will_be, log_memory_usage);
+ peak_updated = updatePeak(will_be, log_memory_usage);
}
else
{
bool log_memory_usage = false;
- updatePeak(will_be, log_memory_usage);
+ peak_updated = updatePeak(will_be, log_memory_usage);
+ }
+
+ if (peak_updated && allocation_traced)
+ {
+ BlockerInThread untrack_lock(VariableContext::Global);
+ DB::TraceCollector::collect(DB::TraceType::MemoryPeak, StackTrace(), will_be);
}
if (auto * loaded_next = parent.load(std::memory_order_relaxed))
@@ -259,7 +269,7 @@ void MemoryTracker::allocNoThrow(Int64 size)
allocImpl(size, throw_if_memory_exceeded);
}
-void MemoryTracker::updatePeak(Int64 will_be, bool log_memory_usage)
+bool MemoryTracker::updatePeak(Int64 will_be, bool log_memory_usage)
{
auto peak_old = peak.load(std::memory_order_relaxed);
if (will_be > peak_old) /// Races doesn't matter. Could rewrite with CAS, but not worth.
@@ -269,7 +279,10 @@ void MemoryTracker::updatePeak(Int64 will_be, bool log_memory_usage)
if (log_memory_usage && (level == VariableContext::Process || level == VariableContext::Global)
&& will_be / log_peak_memory_usage_every > peak_old / log_peak_memory_usage_every)
logMemoryUsage(will_be);
+
+ return true;
}
+ return false;
}
diff --git a/src/Common/MemoryTracker.h b/src/Common/MemoryTracker.h
index 36560fec334..af5cdd1e41b 100644
--- a/src/Common/MemoryTracker.h
+++ b/src/Common/MemoryTracker.h
@@ -58,7 +58,7 @@ private:
/// This description will be used as prefix into log messages (if isn't nullptr)
std::atomic<const char *> description_ptr = nullptr;
- void updatePeak(Int64 will_be, bool log_memory_usage);
+ bool updatePeak(Int64 will_be, bool log_memory_usage);
void logMemoryUsage(Int64 current) const;
public:
diff --git a/src/Common/TraceCollector.h b/src/Common/TraceCollector.h
index 86e9d659d0a..d3bbc74726e 100644
--- a/src/Common/TraceCollector.h
+++ b/src/Common/TraceCollector.h
@@ -20,7 +20,8 @@ enum class TraceType : uint8_t
Real,
CPU,
Memory,
- MemorySample
+ MemorySample,
+ MemoryPeak,
};
class TraceCollector
diff --git a/src/Interpreters/TraceLog.cpp b/src/Interpreters/TraceLog.cpp
index dac27aebe58..c16a73e75dc 100644
--- a/src/Interpreters/TraceLog.cpp
+++ b/src/Interpreters/TraceLog.cpp
@@ -19,6 +19,7 @@ const TraceDataType::Values TraceLogElement::trace_values =
{"CPU", static_cast<UInt8>(TraceType::CPU)},
{"Memory", static_cast<UInt8>(TraceType::Memory)},
{"MemorySample", static_cast<UInt8>(TraceType::MemorySample)},
+ {"MemoryPeak", static_cast<UInt8>(TraceType::MemoryPeak)},
};
NamesAndTypesList TraceLogElement::getNamesAndTypes()
diff --git a/tests/queries/0_stateless/01092_memory_profiler.reference b/tests/queries/0_stateless/01092_memory_profiler.reference
index 0d66ea1aee9..986394f7c0f 100644
--- a/tests/queries/0_stateless/01092_memory_profiler.reference
+++ b/tests/queries/0_stateless/01092_memory_profiler.reference
@@ -1,2 +1,3 @@
0
1
+1
diff --git a/tests/queries/0_stateless/01092_memory_profiler.sql b/tests/queries/0_stateless/01092_memory_profiler.sql
index 0988f56413e..658877a1dee 100644
--- a/tests/queries/0_stateless/01092_memory_profiler.sql
+++ b/tests/queries/0_stateless/01092_memory_profiler.sql
@@ -6,3 +6,4 @@ SET memory_profiler_step = 1000000;
SELECT ignore(groupArray(number), 'test memory profiler') FROM numbers(10000000);
SYSTEM FLUSH LOGS;
WITH addressToSymbol(arrayJoin(trace)) AS symbol SELECT count() > 0 FROM system.trace_log t WHERE event_date >= yesterday() AND trace_type = 'Memory' AND query_id = (SELECT query_id FROM system.query_log WHERE current_database = currentDatabase() AND event_date >= yesterday() AND query LIKE '%test memory profiler%' ORDER BY event_time DESC LIMIT 1);
+WITH addressToSymbol(arrayJoin(trace)) AS symbol SELECT count() > 0 FROM system.trace_log t WHERE event_date >= yesterday() AND trace_type = 'MemoryPeak' AND query_id = (SELECT query_id FROM system.query_log WHERE current_database = currentDatabase() AND event_date >= yesterday() AND query LIKE '%test memory profiler%' ORDER BY event_time DESC LIMIT 1);
From 0c0427dc45e0e30b47ac65fd376e14f6f8d0894d Mon Sep 17 00:00:00 2001
From: Azat Khuzhin
Date: Thu, 7 Oct 2021 21:13:56 +0300
Subject: [PATCH 056/104] Cover memory_profiler_sample_probability in
01092_memory_profiler
---
tests/queries/0_stateless/01092_memory_profiler.reference | 1 +
tests/queries/0_stateless/01092_memory_profiler.sql | 3 +++
2 files changed, 4 insertions(+)
diff --git a/tests/queries/0_stateless/01092_memory_profiler.reference b/tests/queries/0_stateless/01092_memory_profiler.reference
index 986394f7c0f..74240c4b196 100644
--- a/tests/queries/0_stateless/01092_memory_profiler.reference
+++ b/tests/queries/0_stateless/01092_memory_profiler.reference
@@ -1,3 +1,4 @@
0
1
1
+1
diff --git a/tests/queries/0_stateless/01092_memory_profiler.sql b/tests/queries/0_stateless/01092_memory_profiler.sql
index 658877a1dee..b997550e093 100644
--- a/tests/queries/0_stateless/01092_memory_profiler.sql
+++ b/tests/queries/0_stateless/01092_memory_profiler.sql
@@ -3,7 +3,10 @@
SET allow_introspection_functions = 1;
SET memory_profiler_step = 1000000;
+SET memory_profiler_sample_probability = 1;
+
SELECT ignore(groupArray(number), 'test memory profiler') FROM numbers(10000000);
SYSTEM FLUSH LOGS;
WITH addressToSymbol(arrayJoin(trace)) AS symbol SELECT count() > 0 FROM system.trace_log t WHERE event_date >= yesterday() AND trace_type = 'Memory' AND query_id = (SELECT query_id FROM system.query_log WHERE current_database = currentDatabase() AND event_date >= yesterday() AND query LIKE '%test memory profiler%' ORDER BY event_time DESC LIMIT 1);
WITH addressToSymbol(arrayJoin(trace)) AS symbol SELECT count() > 0 FROM system.trace_log t WHERE event_date >= yesterday() AND trace_type = 'MemoryPeak' AND query_id = (SELECT query_id FROM system.query_log WHERE current_database = currentDatabase() AND event_date >= yesterday() AND query LIKE '%test memory profiler%' ORDER BY event_time DESC LIMIT 1);
+WITH addressToSymbol(arrayJoin(trace)) AS symbol SELECT count() > 0 FROM system.trace_log t WHERE event_date >= yesterday() AND trace_type = 'MemorySample' AND query_id = (SELECT query_id FROM system.query_log WHERE current_database = currentDatabase() AND event_date >= yesterday() AND query LIKE '%test memory profiler%' ORDER BY event_time DESC LIMIT 1);
From a171dfd75ec3f27e630696b46ee30f77bca66eb6 Mon Sep 17 00:00:00 2001
From: Azat Khuzhin
Date: Thu, 7 Oct 2021 21:13:56 +0300
Subject: [PATCH 057/104] Make 01092_memory_profiler more robust for dev env
---
tests/queries/0_stateless/01092_memory_profiler.sql | 1 +
1 file changed, 1 insertion(+)
diff --git a/tests/queries/0_stateless/01092_memory_profiler.sql b/tests/queries/0_stateless/01092_memory_profiler.sql
index b997550e093..0db88bb14b3 100644
--- a/tests/queries/0_stateless/01092_memory_profiler.sql
+++ b/tests/queries/0_stateless/01092_memory_profiler.sql
@@ -4,6 +4,7 @@ SET allow_introspection_functions = 1;
SET memory_profiler_step = 1000000;
SET memory_profiler_sample_probability = 1;
+SET log_queries = 1;
SELECT ignore(groupArray(number), 'test memory profiler') FROM numbers(10000000);
SYSTEM FLUSH LOGS;
From 90cc63aecd37ffe7a3f6497b462be55540bc70a5 Mon Sep 17 00:00:00 2001
From: Alexander Tokmakov
Date: Thu, 7 Oct 2021 22:05:51 +0300
Subject: [PATCH 058/104] fix tests
---
tests/integration/helpers/cluster.py | 7 +++++--
1 file changed, 5 insertions(+), 2 deletions(-)
diff --git a/tests/integration/helpers/cluster.py b/tests/integration/helpers/cluster.py
index 5ac4dbc8ad0..5ba67085d73 100644
--- a/tests/integration/helpers/cluster.py
+++ b/tests/integration/helpers/cluster.py
@@ -2357,17 +2357,20 @@ class ClickHouseInstance:
dictionaries_dir = p.abspath(p.join(instance_config_dir, 'dictionaries'))
os.mkdir(dictionaries_dir)
- def write_embedded_config(name, dest_dir):
+ def write_embedded_config(name, dest_dir, fix_log_level=False):
with open(p.join(HELPERS_DIR, name), 'r') as f:
data = f.read()
data = data.replace('yandex', self.config_root_name)
+ if fix_log_level:
+ data = data.replace('test', 'trace')
with open(p.join(dest_dir, name), 'w') as r:
r.write(data)
logging.debug("Copy common configuration from helpers")
# The file is named with 0_ prefix to be processed before other configuration overloads.
if self.copy_common_configs:
- write_embedded_config('0_common_instance_config.xml', self.config_d_dir)
+ need_fix_log_level = self.tag != 'latest'
+ write_embedded_config('0_common_instance_config.xml', self.config_d_dir, need_fix_log_level)
write_embedded_config('0_common_instance_users.xml', users_d_dir)
From c734ada95ba7d5f13591acd32edb38f716784f64 Mon Sep 17 00:00:00 2001
From: kssenii
Date: Thu, 7 Oct 2021 20:26:58 +0000
Subject: [PATCH 059/104] Fix
---
src/Client/ClientBase.cpp | 4 +---
1 file changed, 1 insertion(+), 3 deletions(-)
diff --git a/src/Client/ClientBase.cpp b/src/Client/ClientBase.cpp
index cde5a5f9977..b68df11fd60 100644
--- a/src/Client/ClientBase.cpp
+++ b/src/Client/ClientBase.cpp
@@ -426,10 +426,8 @@ void ClientBase::processTextAsSingleQuery(const String & full_query)
catch (Exception & e)
{
if (!is_interactive)
- {
e.addMessage("(in query: {})", full_query);
- throw;
- }
+ throw;
}
if (have_error)
From e07a6f3fc0ea0b496483287d85b50d29f5a8c330 Mon Sep 17 00:00:00 2001
From: Azat Khuzhin
Date: Thu, 7 Oct 2021 21:09:35 +0300
Subject: [PATCH 060/104] docker: add pandas/clickhouse_driver into test images
---
docker/test/fasttest/Dockerfile | 2 +-
docker/test/fuzzer/Dockerfile | 2 +-
docker/test/stateless/Dockerfile | 2 +-
docker/test/style/Dockerfile | 2 +-
4 files changed, 4 insertions(+), 4 deletions(-)
diff --git a/docker/test/fasttest/Dockerfile b/docker/test/fasttest/Dockerfile
index 798910fb952..f50c65bb9f2 100644
--- a/docker/test/fasttest/Dockerfile
+++ b/docker/test/fasttest/Dockerfile
@@ -67,7 +67,7 @@ RUN apt-get update \
unixodbc \
--yes --no-install-recommends
-RUN pip3 install numpy scipy pandas Jinja2
+RUN pip3 install numpy scipy pandas Jinja2 clickhouse_driver
# This symlink required by gcc to find lld compiler
RUN ln -s /usr/bin/lld-${LLVM_VERSION} /usr/bin/ld.lld
diff --git a/docker/test/fuzzer/Dockerfile b/docker/test/fuzzer/Dockerfile
index 6444e745c47..13353bc2960 100644
--- a/docker/test/fuzzer/Dockerfile
+++ b/docker/test/fuzzer/Dockerfile
@@ -27,7 +27,7 @@ RUN apt-get update \
&& apt-get clean \
&& rm -rf /var/lib/apt/lists/*
-RUN pip3 install Jinja2
+RUN pip3 install Jinja2 pandas clickhouse_driver
COPY * /
diff --git a/docker/test/stateless/Dockerfile b/docker/test/stateless/Dockerfile
index 7de8c061673..a5733d11dd2 100644
--- a/docker/test/stateless/Dockerfile
+++ b/docker/test/stateless/Dockerfile
@@ -34,7 +34,7 @@ RUN apt-get update -y \
postgresql-client \
sqlite3
-RUN pip3 install numpy scipy pandas Jinja2
+RUN pip3 install numpy scipy pandas Jinja2 clickhouse_driver
RUN mkdir -p /tmp/clickhouse-odbc-tmp \
&& wget -nv -O - ${odbc_driver_url} | tar --strip-components=1 -xz -C /tmp/clickhouse-odbc-tmp \
diff --git a/docker/test/style/Dockerfile b/docker/test/style/Dockerfile
index 33cdb9db57a..64cc0c9c7b7 100644
--- a/docker/test/style/Dockerfile
+++ b/docker/test/style/Dockerfile
@@ -10,7 +10,7 @@ RUN apt-get update && env DEBIAN_FRONTEND=noninteractive apt-get install --yes \
python3-pip \
pylint \
yamllint \
- && pip3 install codespell
+ && pip3 install codespell pandas clickhouse_driver
COPY run.sh /
COPY process_style_check_result.py /
From 9dd0fca1edd383c00667ce4c1a953e4f6d2bca1a Mon Sep 17 00:00:00 2001
From: Azat Khuzhin
Date: Thu, 7 Oct 2021 23:45:18 +0300
Subject: [PATCH 061/104] Suppress some existing warnings in clickhouse-test
(will be fixed separately)
---
tests/clickhouse-test | 6 ++++++
1 file changed, 6 insertions(+)
diff --git a/tests/clickhouse-test b/tests/clickhouse-test
index 19080f3934f..2c8093190ea 100755
--- a/tests/clickhouse-test
+++ b/tests/clickhouse-test
@@ -1,6 +1,12 @@
#!/usr/bin/env python3
# pylint: disable=too-many-return-statements
+# pylint: disable=consider-using-f-string
+# pylint: disable=global-variable-not-assigned
+# pylint: disable=consider-using-with
+# pylint: disable=unspecified-encoding
+# pylint: disable=consider-using-min-builtin
+
import enum
import shutil
import sys
From df129d7efc70eb2abc394b72a0dd64c421de8549 Mon Sep 17 00:00:00 2001
From: Azat Khuzhin
Date: Thu, 7 Oct 2021 21:05:42 +0300
Subject: [PATCH 062/104] Rewrite clickhouse-test to use python
clickhouse_driver
Pros:
- Using native protocol over executing binaries is always better
- `clickhouse-client` in debug build takes almost a second to execute simple `SELECT 1`
and `clickhouse-test` requires ~5 queries at start (determine some
flags, zk, alive, create database)
Notes:
- `FORMAT Vertical` had been replaced with printing of `pandas.DataFrame`
And after this patch tiny tests work with the speed of the test, and
do not require +-5 seconds of bootstrapping.
---
tests/clickhouse-test | 424 +++++++++++++++++++-----------------------
1 file changed, 193 insertions(+), 231 deletions(-)
diff --git a/tests/clickhouse-test b/tests/clickhouse-test
index 2c8093190ea..e8c85a6ae79 100755
--- a/tests/clickhouse-test
+++ b/tests/clickhouse-test
@@ -19,13 +19,10 @@ import traceback
import math
from argparse import ArgumentParser
-from typing import Tuple, Union, Optional, TextIO, Dict, Set, List
-import shlex
+from typing import Tuple, Union, Optional, Dict, Set, List
import subprocess
from subprocess import Popen
from subprocess import PIPE
-from subprocess import CalledProcessError
-from subprocess import TimeoutExpired
from datetime import datetime
from time import time, sleep
from errno import ESRCH
@@ -41,6 +38,9 @@ import multiprocessing
import socket
from contextlib import closing
+import clickhouse_driver
+import pandas
+
USE_JINJA = True
try:
import jinja2
@@ -48,20 +48,45 @@ except ImportError:
USE_JINJA = False
print('WARNING: jinja2 not installed! Template tests will be skipped.')
-DISTRIBUTED_DDL_TIMEOUT_MSG = "is executing longer than distributed_ddl_task_timeout"
-
MESSAGES_TO_RETRY = [
"ConnectionPoolWithFailover: Connection failed at try",
"DB::Exception: New table appeared in database being dropped or detached. Try again",
"is already started to be removing by another replica right now",
"DB::Exception: Cannot enqueue query",
- DISTRIBUTED_DDL_TIMEOUT_MSG # FIXME
+ "is executing longer than distributed_ddl_task_timeout" # FIXME
+]
+error_codes = clickhouse_driver.errors.ErrorCodes
+error_codes.NOT_A_LEADER = 529
+ERROR_CODES_TO_RETRY = [
+ error_codes.ALL_CONNECTION_TRIES_FAILED,
+ error_codes.DATABASE_NOT_EMPTY,
+ error_codes.NOT_A_LEADER,
+ error_codes.UNFINISHED,
]
MAX_RETRIES = 3
TEST_FILE_EXTENSIONS = ['.sql', '.sql.j2', '.sh', '.py', '.expect']
+class Client(clickhouse_driver.Client):
+ # return first column of the first row
+ def execute_one(self, *args, **kwargs):
+ return super().execute(*args, **kwargs)[0][0]
+
+ # return pandas.DataFrame
+ def execute_pandas(self, *args, **kwargs):
+ data = super().execute(*args, **kwargs, with_column_types=True)
+ return Client.__combine(data)
+
+ @staticmethod
+ def __combine(data):
+ cols = data[1]
+ rows = data[0]
+ header = [ i[0] for i in cols ]
+ data = pandas.DataFrame(data=rows, columns=header)
+ return data
+
+
class Terminated(KeyboardInterrupt):
pass
@@ -103,18 +128,16 @@ def get_db_engine(args, database_name):
def get_zookeeper_session_uptime(args):
+ global clickhouse_client
+
try:
- query = b"SELECT zookeeperSessionUptime()"
-
if args.replicated_database:
- query = b"SELECT min(materialize(zookeeperSessionUptime())) " \
- b"FROM clusterAllReplicas('test_cluster_database_replicated', system.one) "
-
- clickhouse_proc = open_client_process(args.client)
-
- (stdout, _) = clickhouse_proc.communicate((query), timeout=20)
-
- return int(stdout.decode('utf-8').strip())
+ return int(clickhouse_client.execute_one("""
+ SELECT min(materialize(zookeeperSessionUptime()))
+ FROM clusterAllReplicas('test_cluster_database_replicated', system.one)
+ """))
+ else:
+ return int(clickhouse_client.execute_one('SELECT zookeeperSessionUptime()'))
except:
return None
@@ -128,24 +151,31 @@ def need_retry(args, stdout, stderr, total_time):
return True
return any(msg in stdout for msg in MESSAGES_TO_RETRY) or any(msg in stderr for msg in MESSAGES_TO_RETRY)
+def need_retry_error(args, error, total_time):
+ # Sometimes we may get unexpected exception like "Replica is readonly" or "Shutdown is called for table"
+ # instead of "Session expired" or "Connection loss"
+ # Retry if session was expired during test execution
+ session_uptime = get_zookeeper_session_uptime(args)
+ if session_uptime is not None and session_uptime < math.ceil(total_time):
+ return True
+ if isinstance(error, clickhouse_driver.errors.Error):
+ if error.code in ERROR_CODES_TO_RETRY:
+ return True
+ if any(msg in error.message for msg in MESSAGES_TO_RETRY):
+ return True
+ return False
+
def get_processlist(args):
- try:
- query = b"SHOW PROCESSLIST FORMAT Vertical"
-
- if args.replicated_database:
- query = b"SELECT materialize((hostName(), tcpPort())) as host, * " \
- b"FROM clusterAllReplicas('test_cluster_database_replicated', system.processes) " \
- b"WHERE query NOT LIKE '%system.processes%' FORMAT Vertical"
-
- clickhouse_proc = open_client_process(args.client)
-
- (stdout, _) = clickhouse_proc.communicate((query), timeout=20)
-
- return False, stdout.decode('utf-8')
- except Exception as ex:
- print("Exception", ex)
- return True, ""
+ global clickhouse_client
+ if args.replicated_database:
+ return clickhouse_client.execute_pandas("""
+ SELECT materialize((hostName(), tcpPort())) as host, *
+ FROM clusterAllReplicas('test_cluster_database_replicated', system.processes)
+ WHERE query NOT LIKE '%system.processes%'
+ """)
+ else:
+ return clickhouse_client.execute_pandas('SHOW PROCESSLIST')
# collect server stacktraces using gdb
@@ -311,7 +341,8 @@ class TestCase:
return None
@staticmethod
- def configure_testcase_args(args, case_file, suite_tmp_dir, stderr_file):
+ def configure_testcase_args(args, case_file, suite_tmp_dir):
+ global clickhouse_client
testcase_args = copy.deepcopy(args)
testcase_args.testcase_start_time = datetime.now()
@@ -331,23 +362,11 @@ class TestCase:
database = 'test_{suffix}'.format(suffix=random_str())
- with open(stderr_file, 'w') as stderr:
- client_cmd = testcase_args.testcase_client + " " \
- + get_additional_client_options(args)
-
- clickhouse_proc_create = open_client_process(
- universal_newlines=True,
- client_args=client_cmd,
- stderr_file=stderr)
-
- try:
- clickhouse_proc_create.communicate(
- ("CREATE DATABASE " + database + get_db_engine(testcase_args, database)),
- timeout=testcase_args.timeout)
- except TimeoutExpired:
- total_time = (datetime.now() - testcase_args.testcase_start_time).total_seconds()
- return clickhouse_proc_create, "", "Timeout creating database {} before test".format(
- database), total_time
+ try:
+ clickhouse_client.execute("CREATE DATABASE " + database + get_db_engine(testcase_args, database), settings={'log_comment': testcase_basename})
+ except (TimeoutError, clickhouse_driver.errors.SocketTimeoutError):
+ total_time = (datetime.now() - testcase_args.testcase_start_time).total_seconds()
+ return None, "", f"Timeout creating database {database} before test", total_time
os.environ["CLICKHOUSE_DATABASE"] = database
# Set temporary directory to match the randomly generated database,
@@ -418,41 +437,42 @@ class TestCase:
def process_result_impl(self, proc, stdout: str, stderr: str, total_time: float):
description = ""
- if proc.returncode is None:
- try:
- proc.kill()
- except OSError as e:
- if e.errno != ESRCH:
- raise
+ if proc:
+ if proc.returncode is None:
+ try:
+ proc.kill()
+ except OSError as e:
+ if e.errno != ESRCH:
+ raise
- if stderr:
- description += stderr
- return TestResult(self.name, TestStatus.FAIL, FailureReason.TIMEOUT, total_time, description)
+ if stderr:
+ description += stderr
+ return TestResult(self.name, TestStatus.FAIL, FailureReason.TIMEOUT, total_time, description)
- if proc.returncode != 0:
- reason = FailureReason.EXIT_CODE
- description += str(proc.returncode)
+ if proc.returncode != 0:
+ reason = FailureReason.EXIT_CODE
+ description += str(proc.returncode)
- if stderr:
- description += "\n"
- description += stderr
+ if stderr:
+ description += "\n"
+ description += stderr
- # Stop on fatal errors like segmentation fault. They are sent to client via logs.
- if ' ' in stderr:
- reason = FailureReason.SERVER_DIED
+ # Stop on fatal errors like segmentation fault. They are sent to client via logs.
+ if ' ' in stderr:
+ reason = FailureReason.SERVER_DIED
- if self.testcase_args.stop \
- and ('Connection refused' in stderr or 'Attempt to read after eof' in stderr) \
- and 'Received exception from server' not in stderr:
- reason = FailureReason.SERVER_DIED
+ if self.testcase_args.stop \
+ and ('Connection refused' in stderr or 'Attempt to read after eof' in stderr) \
+ and 'Received exception from server' not in stderr:
+ reason = FailureReason.SERVER_DIED
- if os.path.isfile(self.stdout_file):
- description += ", result:\n\n"
- description += '\n'.join(open(self.stdout_file).read().split('\n')[:100])
- description += '\n'
+ if os.path.isfile(self.stdout_file):
+ description += ", result:\n\n"
+ description += '\n'.join(open(self.stdout_file).read().split('\n')[:100])
+ description += '\n'
- description += "\nstdout:\n{}\n".format(stdout)
- return TestResult(self.name, TestStatus.FAIL, reason, total_time, description)
+ description += "\nstdout:\n{}\n".format(stdout)
+ return TestResult(self.name, TestStatus.FAIL, reason, total_time, description)
if stderr:
description += "\n{}\n".format('\n'.join(stderr.split('\n')[:100]))
@@ -516,21 +536,12 @@ class TestCase:
@staticmethod
def send_test_name_failed(suite: str, case: str) -> bool:
- clickhouse_proc = open_client_process(args.client, universal_newlines=True)
-
- failed_to_check = False
-
+ global clickhouse_client
pid = os.getpid()
- query = f"SELECT 'Running test {suite}/{case} from pid={pid}';"
-
- try:
- clickhouse_proc.communicate((query), timeout=20)
- except:
- failed_to_check = True
-
- return failed_to_check or clickhouse_proc.returncode != 0
+ clickhouse_client.execute(f"SELECT 'Running test {suite}/{case} from pid={pid}'")
def run_single_test(self, server_logs_level, client_options):
+ global clickhouse_client
args = self.testcase_args
client = args.testcase_client
start_time = args.testcase_start_time
@@ -572,28 +583,13 @@ class TestCase:
need_drop_database = not maybe_passed
if need_drop_database:
- with open(self.stderr_file, 'a') as stderr:
- clickhouse_proc_create = open_client_process(client, universal_newlines=True, stderr_file=stderr)
-
seconds_left = max(args.timeout - (datetime.now() - start_time).total_seconds(), 20)
-
try:
- drop_database_query = "DROP DATABASE " + database
- if args.replicated_database:
- drop_database_query += " ON CLUSTER test_cluster_database_replicated"
- clickhouse_proc_create.communicate((drop_database_query), timeout=seconds_left)
- except TimeoutExpired:
- # kill test process because it can also hung
- if proc.returncode is None:
- try:
- proc.kill()
- except OSError as e:
- if e.errno != ESRCH:
- raise
-
+ with clickhouse_client.connection.timeout_setter(seconds_left):
+ clickhouse_client.execute("DROP DATABASE " + database)
+ except (TimeoutError, clickhouse_driver.errors.SocketTimeoutError):
total_time = (datetime.now() - start_time).total_seconds()
- return clickhouse_proc_create, "", f"Timeout dropping database {database} after test", total_time
-
+ return None, "", f"Timeout dropping database {database} after test", total_time
shutil.rmtree(args.test_tmp_dir)
total_time = (datetime.now() - start_time).total_seconds()
@@ -624,12 +620,15 @@ class TestCase:
if skip_reason is not None:
return TestResult(self.name, TestStatus.SKIPPED, skip_reason, 0., "")
- if args.testname and self.send_test_name_failed(suite.suite, self.case):
- description = "\nServer does not respond to health check\n"
- return TestResult(self.name, TestStatus.FAIL, FailureReason.SERVER_DIED, 0., description)
+ if args.testname:
+ try:
+ self.send_test_name_failed(suite.suite, self.case)
+ except:
+ return TestResult(self.name, TestStatus.FAIL, FailureReason.SERVER_DIED, 0.,
+ "\nServer does not respond to health check\n")
self.runs_count += 1
- self.testcase_args = self.configure_testcase_args(args, self.case_file, suite.suite_tmp_path, self.stderr_file)
+ self.testcase_args = self.configure_testcase_args(args, self.case_file, suite.suite_tmp_path)
proc, stdout, stderr, total_time = self.run_single_test(server_logs_level, client_options)
result = self.process_result_impl(proc, stdout, stderr, total_time)
@@ -794,12 +793,8 @@ class TestSuite:
@staticmethod
def readTestSuite(args, suite_dir_name: str):
def is_data_present():
- clickhouse_proc = open_client_process(args.client)
- (stdout, stderr) = clickhouse_proc.communicate(b"EXISTS TABLE test.hits")
- if clickhouse_proc.returncode != 0:
- raise CalledProcessError(clickhouse_proc.returncode, args.client, stderr)
-
- return stdout.startswith(b'1')
+ global clickhouse_client
+ return int(clickhouse_client.execute_one('EXISTS TABLE test.hits'))
base_dir = os.path.abspath(args.queries)
tmp_dir = os.path.abspath(args.tmp)
@@ -832,6 +827,7 @@ class TestSuite:
stop_time = None
+clickhouse_client = None
exit_code = None
server_died = None
stop_tests_triggered_lock = None
@@ -961,42 +957,26 @@ def run_tests_array(all_tests_with_params):
server_logs_level = "warning"
-def check_server_started(client, retry_count):
+def check_server_started(retry_count):
+ global clickhouse_client
print("Connecting to ClickHouse server...", end='')
sys.stdout.flush()
-
while retry_count > 0:
- clickhouse_proc = open_client_process(client)
- (stdout, stderr) = clickhouse_proc.communicate(b"SELECT 1")
-
- if clickhouse_proc.returncode == 0 and stdout.startswith(b"1"):
+ try:
+ clickhouse_client.execute('SELECT 1')
print(" OK")
sys.stdout.flush()
return True
-
- if clickhouse_proc.returncode == 210:
- # Connection refused, retry
+ except (ConnectionRefusedError, ConnectionResetError, clickhouse_driver.errors.NetworkError):
print('.', end='')
sys.stdout.flush()
retry_count -= 1
sleep(0.5)
continue
- code: int = clickhouse_proc.returncode
-
- print(f"\nClient invocation failed with code {code}:\n\
- stdout: {stdout}\n\
- stderr: {stderr}\n\
- args: {''.join(clickhouse_proc.args)}\n")
-
- sys.stdout.flush()
-
- return False
-
print('\nAll connection tries failed')
sys.stdout.flush()
-
return False
@@ -1012,60 +992,38 @@ class BuildFlags():
POLYMORPHIC_PARTS = 'polymorphic-parts'
-def collect_build_flags(client):
- clickhouse_proc = open_client_process(client)
- (stdout, stderr) = clickhouse_proc.communicate(b"SELECT value FROM system.build_options WHERE name = 'CXX_FLAGS'")
+def collect_build_flags():
+ global clickhouse_client
+
result = []
- if clickhouse_proc.returncode == 0:
- if b'-fsanitize=thread' in stdout:
- result.append(BuildFlags.THREAD)
- elif b'-fsanitize=address' in stdout:
- result.append(BuildFlags.ADDRESS)
- elif b'-fsanitize=undefined' in stdout:
- result.append(BuildFlags.UNDEFINED)
- elif b'-fsanitize=memory' in stdout:
- result.append(BuildFlags.MEMORY)
- else:
- raise Exception("Cannot get information about build from server errorcode {}, stderr {}".format(clickhouse_proc.returncode, stderr))
+ value = clickhouse_client.execute_one("SELECT value FROM system.build_options WHERE name = 'CXX_FLAGS'")
+ if '-fsanitize=thread' in value:
+ result.append(BuildFlags.THREAD)
+ elif '-fsanitize=address' in value:
+ result.append(BuildFlags.ADDRESS)
+ elif '-fsanitize=undefined' in value:
+ result.append(BuildFlags.UNDEFINED)
+ elif '-fsanitize=memory' in value:
+ result.append(BuildFlags.MEMORY)
- clickhouse_proc = open_client_process(client)
- (stdout, stderr) = clickhouse_proc.communicate(b"SELECT value FROM system.build_options WHERE name = 'BUILD_TYPE'")
+ value = clickhouse_client.execute_one("SELECT value FROM system.build_options WHERE name = 'BUILD_TYPE'")
+ if 'Debug' in value:
+ result.append(BuildFlags.DEBUG)
+ elif 'RelWithDebInfo' in value or 'Release' in value:
+ result.append(BuildFlags.RELEASE)
- if clickhouse_proc.returncode == 0:
- if b'Debug' in stdout:
- result.append(BuildFlags.DEBUG)
- elif b'RelWithDebInfo' in stdout or b'Release' in stdout:
- result.append(BuildFlags.RELEASE)
- else:
- raise Exception("Cannot get information about build from server errorcode {}, stderr {}".format(clickhouse_proc.returncode, stderr))
+ value = clickhouse_client.execute_one("SELECT value FROM system.build_options WHERE name = 'UNBUNDLED'")
+ if value in ('ON', '1'):
+ result.append(BuildFlags.UNBUNDLED)
- clickhouse_proc = open_client_process(client)
- (stdout, stderr) = clickhouse_proc.communicate(b"SELECT value FROM system.build_options WHERE name = 'UNBUNDLED'")
+ value = clickhouse_client.execute_one("SELECT value FROM system.settings WHERE name = 'default_database_engine'")
+ if value == 'Ordinary':
+ result.append(BuildFlags.ORDINARY_DATABASE)
- if clickhouse_proc.returncode == 0:
- if b'ON' in stdout or b'1' in stdout:
- result.append(BuildFlags.UNBUNDLED)
- else:
- raise Exception("Cannot get information about build from server errorcode {}, stderr {}".format(clickhouse_proc.returncode, stderr))
-
- clickhouse_proc = open_client_process(client)
- (stdout, stderr) = clickhouse_proc.communicate(b"SELECT value FROM system.settings WHERE name = 'default_database_engine'")
-
- if clickhouse_proc.returncode == 0:
- if b'Ordinary' in stdout:
- result.append(BuildFlags.ORDINARY_DATABASE)
- else:
- raise Exception("Cannot get information about build from server errorcode {}, stderr {}".format(clickhouse_proc.returncode, stderr))
-
- clickhouse_proc = open_client_process(client)
- (stdout, stderr) = clickhouse_proc.communicate(b"SELECT value FROM system.merge_tree_settings WHERE name = 'min_bytes_for_wide_part'")
-
- if clickhouse_proc.returncode == 0:
- if stdout == b'0\n':
- result.append(BuildFlags.POLYMORPHIC_PARTS)
- else:
- raise Exception("Cannot get inforamtion about build from server errorcode {}, stderr {}".format(clickhouse_proc.returncode, stderr))
+ value = int(clickhouse_client.execute_one("SELECT value FROM system.merge_tree_settings WHERE name = 'min_bytes_for_wide_part'"))
+ if value == 0:
+ result.append(BuildFlags.POLYMORPHIC_PARTS)
return result
@@ -1092,16 +1050,6 @@ def extract_key(key: str) -> str:
args.configserver + key)[1]
-def open_client_process(
- client_args: str,
- universal_newlines: bool = False,
- stderr_file: Optional[TextIO] = None):
- return Popen(
- shlex.split(client_args), stdin=PIPE, stdout=PIPE,
- stderr=stderr_file if stderr_file is not None else PIPE,
- universal_newlines=True if universal_newlines else None)
-
-
def do_run_tests(jobs, test_suite: TestSuite, parallel):
if jobs > 1 and len(test_suite.parallel_tests) > 0:
print("Found", len(test_suite.parallel_tests), "parallel tests and", len(test_suite.sequential_tests), "sequential tests")
@@ -1170,8 +1118,9 @@ def main(args):
global exit_code
global server_logs_level
global restarted_tests
+ global clickhouse_client
- if not check_server_started(args.client, args.server_check_retries):
+ if not check_server_started(args.server_check_retries):
msg = "Server is not responding. Cannot execute 'SELECT 1' query. \
If you are using split build, you have to specify -c option."
if args.hung_check:
@@ -1181,13 +1130,12 @@ def main(args):
print_stacktraces()
raise Exception(msg)
- args.build_flags = collect_build_flags(args.client)
+ args.build_flags = collect_build_flags()
if args.skip:
args.skip = set(args.skip)
base_dir = os.path.abspath(args.queries)
- tmp_dir = os.path.abspath(args.tmp)
# Keep same default values as in queries/shell_config.sh
os.environ.setdefault("CLICKHOUSE_BINARY", args.binary)
@@ -1218,17 +1166,12 @@ def main(args):
create_database_retries = 0
while create_database_retries < MAX_RETRIES:
start_time = datetime.now()
-
- client_cmd = args.client + " " + get_additional_client_options(args)
-
- clickhouse_proc_create = open_client_process(client_cmd, universal_newlines=True)
-
- (stdout, stderr) = clickhouse_proc_create.communicate(("CREATE DATABASE IF NOT EXISTS " + db_name + get_db_engine(args, db_name)))
-
- total_time = (datetime.now() - start_time).total_seconds()
-
- if not need_retry(args, stdout, stderr, total_time):
- break
+ try:
+ clickhouse_client.execute("CREATE DATABASE IF NOT EXISTS " + db_name + get_db_engine(args, db_name))
+ except Exception as e:
+ total_time = (datetime.now() - start_time).total_seconds()
+ if not need_retry_error(args, e, total_time):
+ break
create_database_retries += 1
if args.database and args.database != "test":
@@ -1255,18 +1198,14 @@ def main(args):
# Some queries may execute in background for some time after test was finished. This is normal.
for _ in range(1, 60):
- timeout, processlist = get_processlist(args)
- if timeout or not processlist:
+ processlist = get_processlist(args)
+ if processlist.empty:
break
sleep(1)
- if timeout or processlist:
- if processlist:
- print(colored("\nFound hung queries in processlist:", args, "red", attrs=["bold"]))
- print(processlist)
- else:
- print(colored("Seems like server hung and cannot respond to queries", args, "red", attrs=["bold"]))
-
+ if not processlist.empty:
+ print(colored("\nFound hung queries in processlist:", args, "red", attrs=["bold"]))
+ print(processlist)
print_stacktraces()
exit_code.value = 1
@@ -1311,16 +1250,20 @@ def find_binary(name):
def get_additional_client_options(args):
if args.client_option:
return ' '.join('--' + option for option in args.client_option)
-
return ''
-
def get_additional_client_options_url(args):
if args.client_option:
return '&'.join(args.client_option)
-
return ''
+def get_additional_client_options_dict(args):
+ settings = {}
+ if args.client_option:
+ for key, value in map(lambda x: x.split('='), args.client_option):
+ settings[key] = value
+ return settings
+
if __name__ == '__main__':
stop_time = None
@@ -1439,14 +1382,24 @@ if __name__ == '__main__':
if args.configclient:
args.client += ' --config-file=' + args.configclient
- if os.getenv("CLICKHOUSE_HOST"):
- args.client += ' --host=' + os.getenv("CLICKHOUSE_HOST")
+ tcp_host = os.getenv("CLICKHOUSE_HOST")
+ if tcp_host is not None:
+ args.client += f' --host={tcp_host}'
+ else:
+ tcp_host = 'localhost'
- args.tcp_port = int(os.getenv("CLICKHOUSE_PORT_TCP", "9000"))
- args.client += f" --port={args.tcp_port}"
+ tcp_port = os.getenv("CLICKHOUSE_PORT_TCP")
+ if tcp_port is not None:
+ args.tcp_port = int(tcp_port)
+ args.client += f" --port={tcp_port}"
+ else:
+ args.tcp_port = 9000
- if os.getenv("CLICKHOUSE_DATABASE"):
- args.client += ' --database=' + os.getenv("CLICKHOUSE_DATABASE")
+ client_database = os.getenv("CLICKHOUSE_DATABASE")
+ if client_database is not None:
+ args.client += f' --database={client_database}'
+ else:
+ client_database = 'default'
if args.client_option:
# Set options for client
@@ -1474,4 +1427,13 @@ if __name__ == '__main__':
if args.jobs is None:
args.jobs = multiprocessing.cpu_count()
+ # configure pandas to make it more like Vertical format
+ pandas.options.display.max_columns = None
+ pandas.options.display.width = None
+
+ clickhouse_client = Client(host=tcp_host,
+ port=args.tcp_port,
+ database=client_database,
+ settings=get_additional_client_options_dict(args))
+
main(args)
From e2d6698244d43979b3fe2478dfdcd8dc3a91a0fd Mon Sep 17 00:00:00 2001
From: Azat Khuzhin
Date: Fri, 8 Oct 2021 00:07:05 +0300
Subject: [PATCH 063/104] clickhouse-test: do not use persistent connection for
simplicity (due to threads)
---
tests/clickhouse-test | 77 +++++++++++++++++++++----------------------
1 file changed, 38 insertions(+), 39 deletions(-)
diff --git a/tests/clickhouse-test b/tests/clickhouse-test
index e8c85a6ae79..6bbfa97ab66 100755
--- a/tests/clickhouse-test
+++ b/tests/clickhouse-test
@@ -86,6 +86,17 @@ class Client(clickhouse_driver.Client):
data = pandas.DataFrame(data=rows, columns=header)
return data
+# Helpers
+def make_clickhouse_client(base_args, *args, **kwargs):
+ return Client(host=base_args.tcp_host, port=base_args.tcp_port,
+ settings=get_additional_client_options_dict(base_args))
+def clickhouse_execute_one(base_args, *args, **kwargs):
+ return make_clickhouse_client(base_args).execute_one(*args, **kwargs)
+def clickhouse_execute(base_args, *args, **kwargs):
+ return make_clickhouse_client(base_args).execute(*args, **kwargs)
+def clickhouse_execute_pandas(base_args, *args, **kwargs):
+ return make_clickhouse_client(base_args).execute_pandas(*args, **kwargs)
+
class Terminated(KeyboardInterrupt):
pass
@@ -128,16 +139,14 @@ def get_db_engine(args, database_name):
def get_zookeeper_session_uptime(args):
- global clickhouse_client
-
try:
if args.replicated_database:
- return int(clickhouse_client.execute_one("""
+ return int(clickhouse_execute_one(args, """
SELECT min(materialize(zookeeperSessionUptime()))
FROM clusterAllReplicas('test_cluster_database_replicated', system.one)
"""))
else:
- return int(clickhouse_client.execute_one('SELECT zookeeperSessionUptime()'))
+ return int(clickhouse_execute_one(args, 'SELECT zookeeperSessionUptime()'))
except:
return None
@@ -167,15 +176,14 @@ def need_retry_error(args, error, total_time):
def get_processlist(args):
- global clickhouse_client
if args.replicated_database:
- return clickhouse_client.execute_pandas("""
+ return clickhouse_execute_pandas(args, """
SELECT materialize((hostName(), tcpPort())) as host, *
FROM clusterAllReplicas('test_cluster_database_replicated', system.processes)
WHERE query NOT LIKE '%system.processes%'
""")
else:
- return clickhouse_client.execute_pandas('SHOW PROCESSLIST')
+ return clickhouse_execute_pandas(args, 'SHOW PROCESSLIST')
# collect server stacktraces using gdb
@@ -342,7 +350,6 @@ class TestCase:
@staticmethod
def configure_testcase_args(args, case_file, suite_tmp_dir):
- global clickhouse_client
testcase_args = copy.deepcopy(args)
testcase_args.testcase_start_time = datetime.now()
@@ -363,7 +370,7 @@ class TestCase:
database = 'test_{suffix}'.format(suffix=random_str())
try:
- clickhouse_client.execute("CREATE DATABASE " + database + get_db_engine(testcase_args, database), settings={'log_comment': testcase_basename})
+ clickhouse_execute(args, "CREATE DATABASE " + database + get_db_engine(testcase_args, database), settings={'log_comment': testcase_basename})
except (TimeoutError, clickhouse_driver.errors.SocketTimeoutError):
total_time = (datetime.now() - testcase_args.testcase_start_time).total_seconds()
return None, "", f"Timeout creating database {database} before test", total_time
@@ -536,12 +543,10 @@ class TestCase:
@staticmethod
def send_test_name_failed(suite: str, case: str) -> bool:
- global clickhouse_client
pid = os.getpid()
- clickhouse_client.execute(f"SELECT 'Running test {suite}/{case} from pid={pid}'")
+ clickhouse_execute(args, f"SELECT 'Running test {suite}/{case} from pid={pid}'")
def run_single_test(self, server_logs_level, client_options):
- global clickhouse_client
args = self.testcase_args
client = args.testcase_client
start_time = args.testcase_start_time
@@ -585,8 +590,10 @@ class TestCase:
if need_drop_database:
seconds_left = max(args.timeout - (datetime.now() - start_time).total_seconds(), 20)
try:
- with clickhouse_client.connection.timeout_setter(seconds_left):
- clickhouse_client.execute("DROP DATABASE " + database)
+ client = make_clickhouse_client(args)
+ client.connection.force_connect()
+ with client.connection.timeout_setter(seconds_left):
+ client.execute("DROP DATABASE " + database)
except (TimeoutError, clickhouse_driver.errors.SocketTimeoutError):
total_time = (datetime.now() - start_time).total_seconds()
return None, "", f"Timeout dropping database {database} after test", total_time
@@ -793,8 +800,7 @@ class TestSuite:
@staticmethod
def readTestSuite(args, suite_dir_name: str):
def is_data_present():
- global clickhouse_client
- return int(clickhouse_client.execute_one('EXISTS TABLE test.hits'))
+ return int(clickhouse_execute_one(args, 'EXISTS TABLE test.hits'))
base_dir = os.path.abspath(args.queries)
tmp_dir = os.path.abspath(args.tmp)
@@ -827,7 +833,6 @@ class TestSuite:
stop_time = None
-clickhouse_client = None
exit_code = None
server_died = None
stop_tests_triggered_lock = None
@@ -957,14 +962,14 @@ def run_tests_array(all_tests_with_params):
server_logs_level = "warning"
-def check_server_started(retry_count):
- global clickhouse_client
+def check_server_started(args):
print("Connecting to ClickHouse server...", end='')
sys.stdout.flush()
+ retry_count = args.server_check_retries
while retry_count > 0:
try:
- clickhouse_client.execute('SELECT 1')
+ clickhouse_execute(args, 'SELECT 1')
print(" OK")
sys.stdout.flush()
return True
@@ -992,12 +997,10 @@ class BuildFlags():
POLYMORPHIC_PARTS = 'polymorphic-parts'
-def collect_build_flags():
- global clickhouse_client
-
+def collect_build_flags(args):
result = []
- value = clickhouse_client.execute_one("SELECT value FROM system.build_options WHERE name = 'CXX_FLAGS'")
+ value = clickhouse_execute_one(args, "SELECT value FROM system.build_options WHERE name = 'CXX_FLAGS'")
if '-fsanitize=thread' in value:
result.append(BuildFlags.THREAD)
elif '-fsanitize=address' in value:
@@ -1007,21 +1010,21 @@ def collect_build_flags():
elif '-fsanitize=memory' in value:
result.append(BuildFlags.MEMORY)
- value = clickhouse_client.execute_one("SELECT value FROM system.build_options WHERE name = 'BUILD_TYPE'")
+ value = clickhouse_execute_one(args, "SELECT value FROM system.build_options WHERE name = 'BUILD_TYPE'")
if 'Debug' in value:
result.append(BuildFlags.DEBUG)
elif 'RelWithDebInfo' in value or 'Release' in value:
result.append(BuildFlags.RELEASE)
- value = clickhouse_client.execute_one("SELECT value FROM system.build_options WHERE name = 'UNBUNDLED'")
+ value = clickhouse_execute_one(args, "SELECT value FROM system.build_options WHERE name = 'UNBUNDLED'")
if value in ('ON', '1'):
result.append(BuildFlags.UNBUNDLED)
- value = clickhouse_client.execute_one("SELECT value FROM system.settings WHERE name = 'default_database_engine'")
+ value = clickhouse_execute_one(args, "SELECT value FROM system.settings WHERE name = 'default_database_engine'")
if value == 'Ordinary':
result.append(BuildFlags.ORDINARY_DATABASE)
- value = int(clickhouse_client.execute_one("SELECT value FROM system.merge_tree_settings WHERE name = 'min_bytes_for_wide_part'"))
+ value = int(clickhouse_execute_one(args, "SELECT value FROM system.merge_tree_settings WHERE name = 'min_bytes_for_wide_part'"))
if value == 0:
result.append(BuildFlags.POLYMORPHIC_PARTS)
@@ -1118,9 +1121,8 @@ def main(args):
global exit_code
global server_logs_level
global restarted_tests
- global clickhouse_client
- if not check_server_started(args.server_check_retries):
+ if not check_server_started(args):
msg = "Server is not responding. Cannot execute 'SELECT 1' query. \
If you are using split build, you have to specify -c option."
if args.hung_check:
@@ -1130,7 +1132,7 @@ def main(args):
print_stacktraces()
raise Exception(msg)
- args.build_flags = collect_build_flags()
+ args.build_flags = collect_build_flags(args)
if args.skip:
args.skip = set(args.skip)
@@ -1167,7 +1169,7 @@ def main(args):
while create_database_retries < MAX_RETRIES:
start_time = datetime.now()
try:
- clickhouse_client.execute("CREATE DATABASE IF NOT EXISTS " + db_name + get_db_engine(args, db_name))
+ clickhouse_execute(args, "CREATE DATABASE IF NOT EXISTS " + db_name + get_db_engine(args, db_name))
except Exception as e:
total_time = (datetime.now() - start_time).total_seconds()
if not need_retry_error(args, e, total_time):
@@ -1384,9 +1386,10 @@ if __name__ == '__main__':
tcp_host = os.getenv("CLICKHOUSE_HOST")
if tcp_host is not None:
+ args.tcp_host = tcp_host
args.client += f' --host={tcp_host}'
else:
- tcp_host = 'localhost'
+ args.tcp_host = 'localhost'
tcp_port = os.getenv("CLICKHOUSE_PORT_TCP")
if tcp_port is not None:
@@ -1398,8 +1401,9 @@ if __name__ == '__main__':
client_database = os.getenv("CLICKHOUSE_DATABASE")
if client_database is not None:
args.client += f' --database={client_database}'
+ args.client_database = client_database
else:
- client_database = 'default'
+ args.client_database = 'default'
if args.client_option:
# Set options for client
@@ -1431,9 +1435,4 @@ if __name__ == '__main__':
pandas.options.display.max_columns = None
pandas.options.display.width = None
- clickhouse_client = Client(host=tcp_host,
- port=args.tcp_port,
- database=client_database,
- settings=get_additional_client_options_dict(args))
-
main(args)
From 004b71d5464cbc608a9f82371f504ec305c4779a Mon Sep 17 00:00:00 2001
From: pawelsz-rb <76971683+pawelsz-rb@users.noreply.github.com>
Date: Thu, 7 Oct 2021 15:27:14 -0700
Subject: [PATCH 064/104] Update adopters.md
Added Rollbar to the adopters list.
---
docs/en/introduction/adopters.md | 1 +
1 file changed, 1 insertion(+)
diff --git a/docs/en/introduction/adopters.md b/docs/en/introduction/adopters.md
index 72ebe33292f..20bf9a10986 100644
--- a/docs/en/introduction/adopters.md
+++ b/docs/en/introduction/adopters.md
@@ -102,6 +102,7 @@ toc_title: Adopters
|