Merge with master

alesapin 2019-08-19 11:20:48 +03:00
commit e7542810bb
186 changed files with 3354 additions and 1603 deletions

.gitmodules vendored
View File

@ -93,7 +93,7 @@
url = https://github.com/ClickHouse-Extras/libunwind.git
[submodule "contrib/simdjson"]
path = contrib/simdjson
url = https://github.com/ClickHouse-Extras/simdjson.git
url = https://github.com/lemire/simdjson.git
[submodule "contrib/rapidjson"]
path = contrib/rapidjson
url = https://github.com/Tencent/rapidjson

View File

@ -264,7 +264,9 @@ if (USE_STATIC_LIBRARIES AND HAVE_NO_PIE)
set (CMAKE_C_FLAGS "${CMAKE_C_FLAGS} ${FLAG_NO_PIE}")
endif ()
if (NOT SANITIZE AND NOT SPLIT_SHARED_LIBRARIES)
# TODO: only enable these extra checks in CI builds, since a lot of contrib libs won't link -
# CI works around this problem by explicitly adding the GLIBC_COMPATIBILITY flag.
if (NOT SANITIZE AND YANDEX_OFFICIAL_BUILD)
set (CMAKE_EXE_LINKER_FLAGS "${CMAKE_EXE_LINKER_FLAGS} -Wl,--no-undefined")
set (CMAKE_SHARED_LINKER_FLAGS "${CMAKE_SHARED_LINKER_FLAGS} -Wl,--no-undefined")
endif ()
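As background on -Wl,--no-undefined: it makes the linker reject a shared object with unresolved symbols at link time, instead of deferring the failure to dlopen. A minimal illustration with a hypothetical source file (not part of this commit):

    // lib.cpp - declares a symbol that is never defined in any linked object.
    void missing_dependency();

    void entry_point()
    {
        missing_dependency();
    }

    // g++ -shared -fPIC lib.cpp -o lib.so                     -> links; fails only at load time
    // g++ -shared -fPIC -Wl,--no-undefined lib.cpp -o lib.so  -> fails at link time

This is why the flag is reserved for builds where all contrib libraries are known to link cleanly.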
@ -328,7 +330,7 @@ if (OS_LINUX AND NOT UNBUNDLED AND (GLIBC_COMPATIBILITY OR USE_INTERNAL_UNWIND_L
if (USE_INTERNAL_LIBCXX_LIBRARY)
set (LIBCXX_LIBS "${ClickHouse_BINARY_DIR}/contrib/libcxx-cmake/libcxx_static${${CMAKE_POSTFIX_VARIABLE}}.a ${ClickHouse_BINARY_DIR}/contrib/libcxxabi-cmake/libcxxabi_static${${CMAKE_POSTFIX_VARIABLE}}.a")
else ()
set (LIBCXX_LIBS "-lc++ -lc++abi")
set (LIBCXX_LIBS "-lc++ -lc++abi -lc++fs")
endif ()
set (DEFAULT_LIBS "${DEFAULT_LIBS} -Wl,-Bstatic ${LIBCXX_LIBS} ${EXCEPTION_HANDLING_LIBRARY} ${BUILTINS_LIB_PATH} -Wl,-Bdynamic")

View File

@ -13,7 +13,8 @@ ClickHouse is an open-source column-oriented database management system that all
* You can also [fill this form](https://forms.yandex.com/surveys/meet-yandex-clickhouse-team/) to meet Yandex ClickHouse team in person.
## Upcoming Events
* [ClickHouse Meetup in Mountain View](https://www.eventbrite.com/e/meetup-clickhouse-in-the-south-bay-registration-65935505873) on August 13.
* [ClickHouse Meetup in Moscow](https://yandex.ru/promo/clickhouse/moscow-2019) on September 5.
* [ClickHouse Meetup in Paris](https://www.eventbrite.com/e/clickhouse-paris-meetup-2019-registration-68493270215) on October 3.
* [ClickHouse Meetup in Hong Kong](https://www.meetup.com/Hong-Kong-Machine-Learning-Meetup/events/263580542/) on October 17.
* [ClickHouse Meetup in Shenzhen](https://www.huodongxing.com/event/3483759917300) on October 20.
* [ClickHouse Meetup in Shanghai](https://www.huodongxing.com/event/4483760336000) on October 27.

View File

@ -1,8 +1,8 @@
option(USE_INTERNAL_CPUINFO_LIBRARY "Set to FALSE to use system cpuinfo library instead of bundled" ${NOT_UNBUNDLED})
# We have no contrib/libcpuinfo submodule for now, so use the system library.
if (USE_INTERNAL_CPUINFO_LIBRARY AND NOT EXISTS "${ClickHouse_SOURCE_DIR}/contrib/libcpuinfo/include")
#message (WARNING "submodule contrib/libcpuid is missing. to fix try run: \n git submodule update --init --recursive")
if (NOT EXISTS "${ClickHouse_SOURCE_DIR}/contrib/libcpuinfo/include")
#message (WARNING "submodule contrib/libcpuinfo is missing. to fix try run: \n git submodule update --init --recursive")
set (USE_INTERNAL_CPUINFO_LIBRARY 0)
set (MISSING_INTERNAL_CPUINFO_LIBRARY 1)
endif ()
@ -12,7 +12,7 @@ if(NOT USE_INTERNAL_CPUINFO_LIBRARY)
find_path(CPUINFO_INCLUDE_DIR NAMES cpuinfo.h PATHS ${CPUINFO_INCLUDE_PATHS})
endif()
if(CPUID_LIBRARY AND CPUID_INCLUDE_DIR)
if(CPUINFO_LIBRARY AND CPUINFO_INCLUDE_DIR)
set(USE_CPUINFO 1)
elseif(NOT MISSING_INTERNAL_CPUINFO_LIBRARY)
set(CPUINFO_INCLUDE_DIR ${ClickHouse_SOURCE_DIR}/contrib/libcpuinfo/include)

View File

@ -3,8 +3,11 @@ if (NOT EXISTS "${ClickHouse_SOURCE_DIR}/contrib/simdjson/include/simdjson/jsonp
return()
endif ()
if (NOT HAVE_AVX2)
message (WARNING "submodule contrib/simdjson requires AVX2 support")
if (NOT HAVE_SSE42)
message (WARNING "submodule contrib/simdjson requires support of SSE4.2 instructions")
return()
elseif (NOT HAVE_PCLMULQDQ)
message (WARNING "submodule contrib/simdjson requires support of PCLMULQDQ instructions")
return()
endif ()
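These build-time probes have a runtime counterpart: FunctionsJSON below only takes the simdjson path when the CPU actually reports SSE4.2 and PCLMUL. A standalone sketch of such a runtime check, using GCC/Clang builtins rather than ClickHouse's Cpu::CpuFlagsCache:

    #include <cstdio>

    int main()
    {
        // __builtin_cpu_supports is a GCC/Clang builtin; it queries CPUID at runtime.
        bool sse42 = __builtin_cpu_supports("sse4.2");
        bool pclmul = __builtin_cpu_supports("pclmul");
        std::printf("SSE4.2: %d, PCLMULQDQ: %d, simdjson usable: %d\n",
                    sse42, pclmul, sse42 && pclmul);
    }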

View File

@ -81,6 +81,17 @@ check_cxx_source_compiles("
}
" HAVE_AVX2)
set (TEST_FLAG "-mpclmul")
set (CMAKE_REQUIRED_FLAGS "${TEST_FLAG} -O0")
check_cxx_source_compiles("
#include <wmmintrin.h>
int main() {
auto a = _mm_clmulepi64_si128(__m128i(), __m128i(), 0);
(void)a;
return 0;
}
" HAVE_PCLMULQDQ)
# gcc -dM -E -mpopcnt - < /dev/null | sort > gcc-dump-popcnt
#define __POPCNT__ 1

@ -1 +1 @@
Subproject commit d85d0e98999cd9e28ceb66645999b4a9ce85370e
Subproject commit c6503d3acc85ca1a7f5e7e38b605d7c9410aac1e

View File

@ -31,6 +31,7 @@ ${MARIADB_CLIENT_SOURCE_DIR}/libmariadb/ma_stmt_codec.c
${MARIADB_CLIENT_SOURCE_DIR}/libmariadb/ma_string.c
${MARIADB_CLIENT_SOURCE_DIR}/libmariadb/ma_time.c
${MARIADB_CLIENT_SOURCE_DIR}/libmariadb/ma_tls.c
${MARIADB_CLIENT_SOURCE_DIR}/libmariadb/secure/openssl_crypt.c
#${MARIADB_CLIENT_SOURCE_DIR}/libmariadb/secure/gnutls.c
#${MARIADB_CLIENT_SOURCE_DIR}/libmariadb/secure/ma_schannel.c
#${MARIADB_CLIENT_SOURCE_DIR}/libmariadb/secure/schannel.c
@ -42,6 +43,7 @@ ${MARIADB_CLIENT_SOURCE_DIR}/plugins/auth/mariadb_cleartext.c
${MARIADB_CLIENT_SOURCE_DIR}/plugins/auth/my_auth.c
${MARIADB_CLIENT_SOURCE_DIR}/plugins/auth/old_password.c
${MARIADB_CLIENT_SOURCE_DIR}/plugins/auth/sha256_pw.c
${MARIADB_CLIENT_SOURCE_DIR}/plugins/auth/caching_sha2_pw.c
#${MARIADB_CLIENT_SOURCE_DIR}/plugins/auth/sspi_client.c
#${MARIADB_CLIENT_SOURCE_DIR}/plugins/auth/sspi_errmsg.c
${MARIADB_CLIENT_SOURCE_DIR}/plugins/connection/aurora.c

View File

@ -76,17 +76,20 @@ struct st_client_plugin_int *plugin_list[MYSQL_CLIENT_MAX_PLUGINS + MARIADB_CLIE
static pthread_mutex_t LOCK_load_client_plugin;
#endif
extern struct st_mysql_client_plugin mysql_native_password_client_plugin;
extern struct st_mysql_client_plugin mysql_old_password_client_plugin;
extern struct st_mysql_client_plugin pvio_socket_client_plugin;
extern struct st_mysql_client_plugin mysql_native_password_client_plugin;
extern struct st_mysql_client_plugin mysql_old_password_client_plugin;
extern struct st_mysql_client_plugin pvio_socket_client_plugin;
extern struct st_mysql_client_plugin sha256_password_client_plugin;
extern struct st_mysql_client_plugin caching_sha2_password_client_plugin;
struct st_mysql_client_plugin *mysql_client_builtins[]=
{
(struct st_mysql_client_plugin *)&mysql_native_password_client_plugin,
(struct st_mysql_client_plugin *)&mysql_old_password_client_plugin,
(struct st_mysql_client_plugin *)&pvio_socket_client_plugin,
(struct st_mysql_client_plugin *)&mysql_native_password_client_plugin,
(struct st_mysql_client_plugin *)&mysql_old_password_client_plugin,
(struct st_mysql_client_plugin *)&pvio_socket_client_plugin,
(struct st_mysql_client_plugin *)&sha256_password_client_plugin,
(struct st_mysql_client_plugin *)&caching_sha2_password_client_plugin,
0
};

contrib/poco vendored

@ -1 +1 @@
Subproject commit 7a2d304c21549427460428c9039009ef4bbfd899
Subproject commit 6216cc01a107ce149863411ca29013a224f80343

contrib/simdjson vendored

@ -1 +1 @@
Subproject commit e3f6322af762213ff2087ce3366bf9541c7fd355
Subproject commit e9be643db5cf1c29a69bc80ee72d220124a9c50e

View File

@ -1,6 +1,3 @@
if (NOT HAVE_AVX2)
message (FATAL_ERROR "No AVX2 support")
endif ()
set(SIMDJSON_INCLUDE_DIR "${ClickHouse_SOURCE_DIR}/contrib/simdjson/include")
set(SIMDJSON_SRC_DIR "${SIMDJSON_INCLUDE_DIR}/../src")
set(SIMDJSON_SRC
@ -16,4 +13,3 @@ set(SIMDJSON_SRC
add_library(${SIMDJSON_LIBRARY} ${SIMDJSON_SRC})
target_include_directories(${SIMDJSON_LIBRARY} SYSTEM PUBLIC "${SIMDJSON_INCLUDE_DIR}")
target_compile_options(${SIMDJSON_LIBRARY} PRIVATE -mavx2 -mbmi -mbmi2 -mpclmul)

View File

@ -1,11 +1,11 @@
# These strings are auto-changed by release_lib.sh:
set(VERSION_REVISION 54425)
set(VERSION_MAJOR 19)
set(VERSION_MINOR 13)
set(VERSION_MINOR 14)
set(VERSION_PATCH 1)
set(VERSION_GITHASH adfc36917222bdb03eba069f0cad0f4f5b8f1c94)
set(VERSION_DESCRIBE v19.13.1.1-prestable)
set(VERSION_STRING 19.13.1.1)
set(VERSION_DESCRIBE v19.14.1.1-prestable)
set(VERSION_STRING 19.14.1.1)
# end of autochange
set(VERSION_EXTRA "" CACHE STRING "")

View File

@ -3,6 +3,8 @@
#include <Core/Types.h>
#include <Common/CpuId.h>
#include <common/getMemoryAmount.h>
#include <DataStreams/copyData.h>
#include <DataStreams/NullBlockOutputStream.h>
#include <DataStreams/RemoteBlockInputStream.h>
#include <IO/ConnectionTimeouts.h>
#include <IO/ReadBufferFromFile.h>
@ -249,6 +251,54 @@ std::vector<TestStats> PerformanceTest::execute()
runQueries(queries_with_indexes, statistics_by_run);
}
if (got_SIGINT)
{
return statistics_by_run;
}
// Pull memory usage data from query log. The log is normally filled in
// background, so we have to flush it synchronously here to see all the
// previous queries.
{
NullBlockOutputStream null_output(Block{});
RemoteBlockInputStream flush_log(connection, "system flush logs",
{} /* header */, context);
copyData(flush_log, null_output);
}
for (auto & statistics : statistics_by_run)
{
if (statistics.query_id.empty())
{
// We have statistics structs for skipped queries as well, so we
// have to filter them out.
continue;
}
// We run some test queries several times, specifying the same query id,
// so this query to the log may return several records. Choose the
// last one, because this is when the query performance has stabilized.
RemoteBlockInputStream log_reader(connection,
"select memory_usage, query_start_time from system.query_log "
"where type = 2 and query_id = '" + statistics.query_id + "' "
"order by query_start_time desc",
{} /* header */, context);
log_reader.readPrefix();
Block block = log_reader.read();
if (block.columns() == 0)
{
LOG_WARNING(log, "Query '" << statistics.query_id << "' is not found in query log.");
continue;
}
auto column = block.getByName("memory_usage").column;
statistics.memory_usage = column->get64(0);
log_reader.readSuffix();
}
return statistics_by_run;
}
@ -298,47 +348,6 @@ void PerformanceTest::runQueries(
break;
}
}
if (got_SIGINT)
{
return;
}
// Pull memory usage data from query log. The log is normally filled in
// background, so we have to flush it synchronously here to see all the
// previous queries.
{
RemoteBlockInputStream flush_log(connection, "system flush logs",
{} /* header */, context);
flush_log.readPrefix();
while (flush_log.read());
flush_log.readSuffix();
}
for (auto & statistics : statistics_by_run)
{
RemoteBlockInputStream log_reader(connection,
"select memory_usage from system.query_log where type = 2 and query_id = '"
+ statistics.query_id + "'",
{} /* header */, context);
log_reader.readPrefix();
Block block = log_reader.read();
if (block.columns() == 0)
{
LOG_WARNING(log, "Query '" << statistics.query_id << "' is not found in query log.");
continue;
}
assert(block.columns() == 1);
assert(block.getDataTypes()[0]->getName() == "UInt64");
ColumnPtr column = block.getByPosition(0).column;
assert(column->size() == 1);
StringRef ref = column->getDataAt(0);
assert(ref.size == sizeof(UInt64));
statistics.memory_usage = *reinterpret_cast<const UInt64*>(ref.data);
log_reader.readSuffix();
}
}

View File

@ -2,7 +2,6 @@
#include <limits>
#include <ext/scope_guard.h>
#include <openssl/rsa.h>
#include <Columns/ColumnVector.h>
#include <Common/config_version.h>
#include <Common/NetException.h>
@ -45,6 +44,7 @@ MySQLHandler::MySQLHandler(IServer & server_, const Poco::Net::StreamSocket & so
, connection_id(connection_id_)
, public_key(public_key_)
, private_key(private_key_)
, auth_plugin(new Authentication::Native41())
{
server_capability_flags = CLIENT_PROTOCOL_41 | CLIENT_SECURE_CONNECTION | CLIENT_PLUGIN_AUTH | CLIENT_PLUGIN_AUTH_LENENC_CLIENT_DATA | CLIENT_CONNECT_WITH_DB | CLIENT_DEPRECATE_EOF;
if (ssl_enabled)
@ -62,9 +62,7 @@ void MySQLHandler::run()
try
{
String scramble = generateScramble();
Handshake handshake(server_capability_flags, connection_id, VERSION_STRING + String("-") + VERSION_NAME, Authentication::Native, scramble + '\0');
Handshake handshake(server_capability_flags, connection_id, VERSION_STRING + String("-") + VERSION_NAME, auth_plugin->getName(), auth_plugin->getAuthPluginData());
packet_sender->sendPacket<Handshake>(handshake, true);
LOG_TRACE(log, "Sent handshake");
@ -96,10 +94,21 @@ void MySQLHandler::run()
client_capability_flags = handshake_response.capability_flags;
if (!(client_capability_flags & CLIENT_PROTOCOL_41))
throw Exception("Required capability: CLIENT_PROTOCOL_41.", ErrorCodes::MYSQL_CLIENT_INSUFFICIENT_CAPABILITIES);
if (!(client_capability_flags & CLIENT_PLUGIN_AUTH))
throw Exception("Required capability: CLIENT_PLUGIN_AUTH.", ErrorCodes::MYSQL_CLIENT_INSUFFICIENT_CAPABILITIES);
authenticate(handshake_response, scramble);
authenticate(handshake_response.username, handshake_response.auth_plugin_name, handshake_response.auth_response);
try
{
if (!handshake_response.database.empty())
connection_context.setCurrentDatabase(handshake_response.database);
connection_context.setCurrentQueryId("");
}
catch (const Exception & exc)
{
log->log(exc);
packet_sender->sendPacket(ERR_Packet(exc.code(), "00000", exc.message()), true);
}
OK_Packet ok_packet(0, handshake_response.capability_flags, 0, 0, 0);
packet_sender->sendPacket(ok_packet, true);
@ -216,121 +225,24 @@ void MySQLHandler::finishHandshake(MySQLProtocol::HandshakeResponse & packet)
}
}
String MySQLHandler::generateScramble()
void MySQLHandler::authenticate(const String & user_name, const String & auth_plugin_name, const String & initial_auth_response)
{
String scramble(MySQLProtocol::SCRAMBLE_LENGTH, 0);
Poco::RandomInputStream generator;
for (size_t i = 0; i < scramble.size(); i++)
{
generator >> scramble[i];
}
return scramble;
}
// For compatibility with JavaScript MySQL client, Native41 authentication plugin is used when possible (if password is specified using double SHA1). Otherwise SHA256 plugin is used.
auto user = connection_context.getUser(user_name);
if (user->password_double_sha1_hex.empty())
auth_plugin = std::make_unique<Authentication::Sha256Password>(public_key, private_key, log);
void MySQLHandler::authenticate(const HandshakeResponse & handshake_response, const String & scramble)
{
String auth_response;
AuthSwitchResponse response;
if (handshake_response.auth_plugin_name != Authentication::SHA256)
{
/** Native authentication sent 20 bytes + '\0' character = 21 bytes.
* This plugin must do the same to stay consistent with historical behavior if it is set to operate as a default plugin.
* https://github.com/mysql/mysql-server/blob/8.0/sql/auth/sql_authentication.cc#L3994
*/
packet_sender->sendPacket(AuthSwitchRequest(Authentication::SHA256, scramble + '\0'), true);
if (in->eof())
throw Exception(
"Client doesn't support authentication method " + String(Authentication::SHA256) + " used by ClickHouse",
ErrorCodes::MYSQL_CLIENT_INSUFFICIENT_CAPABILITIES);
packet_sender->receivePacket(response);
auth_response = response.value;
LOG_TRACE(log, "Authentication method mismatch.");
}
else
{
auth_response = handshake_response.auth_response;
LOG_TRACE(log, "Authentication method match.");
}
if (auth_response == "\1")
{
LOG_TRACE(log, "Client requests public key.");
BIO * mem = BIO_new(BIO_s_mem());
SCOPE_EXIT(BIO_free(mem));
if (PEM_write_bio_RSA_PUBKEY(mem, &public_key) != 1)
{
throw Exception("Failed to write public key to memory. Error: " + getOpenSSLErrors(), ErrorCodes::OPENSSL_ERROR);
}
char * pem_buf = nullptr;
long pem_size = BIO_get_mem_data(mem, &pem_buf);
String pem(pem_buf, pem_size);
LOG_TRACE(log, "Key: " << pem);
AuthMoreData data(pem);
packet_sender->sendPacket(data, true);
packet_sender->receivePacket(response);
auth_response = response.value;
}
else
{
LOG_TRACE(log, "Client didn't request public key.");
}
String password;
/** Decrypt password, if it's not empty.
* The original intention was that the password is a string[NUL] but this never got enforced properly so now we have to accept that
* an empty packet is a blank password, thus the check for auth_response.empty() has to be made too.
* https://github.com/mysql/mysql-server/blob/8.0/sql/auth/sql_authentication.cc#L4017
*/
if (!secure_connection && !auth_response.empty() && auth_response != String("\0", 1))
{
LOG_TRACE(log, "Received nonempty password");
auto ciphertext = reinterpret_cast<unsigned char *>(auth_response.data());
unsigned char plaintext[RSA_size(&private_key)];
int plaintext_size = RSA_private_decrypt(auth_response.size(), ciphertext, plaintext, &private_key, RSA_PKCS1_OAEP_PADDING);
if (plaintext_size == -1)
{
throw Exception("Failed to decrypt auth data. Error: " + getOpenSSLErrors(), ErrorCodes::OPENSSL_ERROR);
}
password.resize(plaintext_size);
for (int i = 0; i < plaintext_size; ++i)
{
password[i] = plaintext[i] ^ static_cast<unsigned char>(scramble[i % scramble.size()]);
}
}
else if (secure_connection)
{
password = auth_response;
}
else
{
LOG_TRACE(log, "Received empty password");
}
if (!password.empty() && password.back() == 0)
{
password.pop_back();
}
try
{
connection_context.setUser(handshake_response.username, password, socket().address(), "");
if (!handshake_response.database.empty()) connection_context.setCurrentDatabase(handshake_response.database);
connection_context.setCurrentQueryId("");
LOG_INFO(log, "Authentication for user " << handshake_response.username << " succeeded.");
try {
std::optional<String> auth_response = auth_plugin_name == auth_plugin->getName() ? std::make_optional<String>(initial_auth_response) : std::nullopt;
auth_plugin->authenticate(user_name, auth_response, connection_context, packet_sender, secure_connection, socket().address());
}
catch (const Exception & exc)
{
LOG_ERROR(log, "Authentication for user " << handshake_response.username << " failed.");
LOG_ERROR(log, "Authentication for user " << user_name << " failed.");
packet_sender->sendPacket(ERR_Packet(exc.code(), "00000", exc.message()), true);
throw;
}
LOG_INFO(log, "Authentication for user " << user_name << " succeeded.");
}
void MySQLHandler::comInitDB(ReadBuffer & payload)

View File

@ -30,9 +30,7 @@ private:
void comInitDB(ReadBuffer & payload);
static String generateScramble();
void authenticate(const MySQLProtocol::HandshakeResponse &, const String & scramble);
void authenticate(const String & user_name, const String & auth_plugin_name, const String & auth_response);
IServer & server;
Poco::Logger * log;
@ -48,6 +46,8 @@ private:
RSA & public_key;
RSA & private_key;
std::unique_ptr<MySQLProtocol::Authentication::IPlugin> auth_plugin;
std::shared_ptr<Poco::Net::SecureStreamSocket> ss;
std::shared_ptr<ReadBuffer> in;
std::shared_ptr<WriteBuffer> out;

View File

@ -0,0 +1,8 @@
<yandex>
<metric_log>
<database>system</database>
<table>metric_log</table>
<flush_interval_milliseconds>7500</flush_interval_milliseconds>
<collect_interval_milliseconds>1000</collect_interval_milliseconds>
</metric_log>
</yandex>

View File

@ -331,6 +331,16 @@
</text_log>
-->
<!-- Uncomment to write metric log into table.
Metric log contains rows with current values of ProfileEvents and CurrentMetrics, collected at "collect_interval_milliseconds" intervals.
<metric_log>
<database>system</database>
<table>metric_log</table>
<flush_interval_milliseconds>7500</flush_interval_milliseconds>
<collect_interval_milliseconds>1000</collect_interval_milliseconds>
</metric_log>
-->
<!-- Parameters for embedded dictionaries, used in Yandex.Metrica.
See https://clickhouse.yandex/docs/en/dicts/internal_dicts/
-->

View File

@ -39,10 +39,18 @@
If you want to specify SHA256, place it in 'password_sha256_hex' element.
Example: <password_sha256_hex>65e84be33532fb784c48129675f9eff3a682b27168c0ea744b2cf58ee02337c5</password_sha256_hex>
Restriction of SHA256: it is impossible to connect to ClickHouse using the MySQL JS client (as of July 2019).
If you want to specify double SHA1, place it in 'password_double_sha1_hex' element.
Example: <password_double_sha1_hex>e395796d6546b1b65db9d665cd43f0e858dd4303</password_double_sha1_hex>
How to generate a decent password:
Execute: PASSWORD=$(base64 < /dev/urandom | head -c8); echo "$PASSWORD"; echo -n "$PASSWORD" | sha256sum | tr -d '-'
The first line will be the password and the second the corresponding SHA256.
How to generate the double SHA1:
Execute: PASSWORD=$(base64 < /dev/urandom | head -c8); echo "$PASSWORD"; echo -n "$PASSWORD" | openssl dgst -sha1 -binary | openssl dgst -sha1
The first line will be the password and the second the corresponding double SHA1.
-->
<password></password>
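The double SHA1 from the shell recipe above can also be computed programmatically; a small sketch using the Poco digest API (the same API the new Native41 plugin uses server-side), with an example password:

    #include <Poco/SHA1Engine.h>
    #include <Poco/DigestEngine.h>
    #include <iostream>
    #include <string>

    int main()
    {
        std::string password = "example_password";
        Poco::SHA1Engine engine;
        engine.update(password);
        Poco::DigestEngine::Digest first = engine.digest(); // SHA1(password); digest() also resets the engine

        engine.update(first.data(), first.size());
        // Hex of SHA1(SHA1(password)) - the value to put into <password_double_sha1_hex>.
        std::cout << Poco::DigestEngine::digestToHex(engine.digest()) << '\n';
    }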

View File

@ -172,7 +172,7 @@
M(OSWriteChars, "Number of bytes written to filesystem, including page cache.") \
M(CreatedHTTPConnections, "Total amount of created HTTP connections (closed or opened).") \
\
M(QueryProfilerCannotWriteTrace, "Number of stack traces dropped by query profiler because pipe is full or cannot write to pipe.") \
M(CannotWriteToWriteBufferDiscard, "Number of stack traces dropped by query profiler or signal handler because pipe is full or cannot write to pipe.") \
M(QueryProfilerSignalOverruns, "Number of times we drop processing of a signal due to overrun plus the number of signals that OS has not delivered due to overrun.") \
namespace ProfileEvents

View File

@ -11,12 +11,11 @@
#include <Common/Exception.h>
#include <Common/thread_local_rng.h>
#include <IO/WriteHelpers.h>
#include <IO/WriteBufferFromFileDescriptor.h>
#include <IO/WriteBufferFromFileDescriptorDiscardOnFailure.h>
namespace ProfileEvents
{
extern const Event QueryProfilerCannotWriteTrace;
extern const Event QueryProfilerSignalOverruns;
}
@ -27,36 +26,6 @@ extern LazyPipe trace_pipe;
namespace
{
/** Write to file descriptor but drop the data if write would block or fail.
* To use within signal handler. Motivating example: a signal handler invoked during execution of malloc
* should not block because some mutex (or even worse - a spinlock) may be held.
*/
class WriteBufferDiscardOnFailure : public WriteBufferFromFileDescriptor
{
protected:
void nextImpl() override
{
size_t bytes_written = 0;
while (bytes_written != offset())
{
ssize_t res = ::write(fd, working_buffer.begin() + bytes_written, offset() - bytes_written);
if ((-1 == res || 0 == res) && errno != EINTR)
{
ProfileEvents::increment(ProfileEvents::QueryProfilerCannotWriteTrace);
break; /// Discard
}
if (res > 0)
bytes_written += res;
}
}
public:
using WriteBufferFromFileDescriptor::WriteBufferFromFileDescriptor;
~WriteBufferDiscardOnFailure() override {}
};
/// Normally query_id is a UUID (a string of fixed length), but a user can provide a custom query_id.
/// Thus an upper bound on query_id length should be introduced to avoid buffer overflow in the signal handler.
constexpr size_t QUERY_ID_MAX_LEN = 1024;
@ -90,7 +59,7 @@ namespace
sizeof(TimerType) + // timer type
sizeof(UInt32); // thread_number
char buffer[buf_size];
WriteBufferDiscardOnFailure out(trace_pipe.fds_rw[1], buf_size, buffer);
WriteBufferFromFileDescriptorDiscardOnFailure out(trace_pipe.fds_rw[1], buf_size, buffer);
StringRef query_id = CurrentThread::getQueryId();
query_id.size = std::min(query_id.size, QUERY_ID_MAX_LEN);
@ -204,11 +173,13 @@ QueryProfilerBase<ProfilerImpl>::~QueryProfilerBase()
template <typename ProfilerImpl>
void QueryProfilerBase<ProfilerImpl>::tryCleanup()
{
#if USE_INTERNAL_UNWIND_LIBRARY
if (timer_id != nullptr && timer_delete(timer_id))
LOG_ERROR(log, "Failed to delete query profiler timer " + errnoToString(ErrorCodes::CANNOT_DELETE_TIMER));
if (previous_handler != nullptr && sigaction(pause_signal, previous_handler, nullptr))
LOG_ERROR(log, "Failed to restore signal handler after query profiler " + errnoToString(ErrorCodes::CANNOT_SET_SIGNAL_HANDLER));
#endif
}
template class QueryProfilerBase<QueryProfilerReal>;

View File

@ -1,7 +1,7 @@
#pragma once
#include <Core/Types.h>
#include <common/config_common.h>
#include <signal.h>
#include <time.h>
@ -43,8 +43,10 @@ private:
Poco::Logger * log;
#if USE_INTERNAL_UNWIND_LIBRARY
/// Timer id from timer_create(2)
timer_t timer_id = nullptr;
#endif
/// Pause signal to interrupt threads to get traces
int pause_signal;

View File

@ -151,6 +151,12 @@ std::string signalToErrorMessage(int sig, const siginfo_t & info, const ucontext
}
break;
}
case SIGPROF:
{
error << "This is a signal used for debugging purposes by the user.";
break;
}
}
return error.str();
@ -239,10 +245,10 @@ const StackTrace::Frames & StackTrace::getFrames() const
}
static std::string toStringImpl(const StackTrace::Frames & frames, size_t offset, size_t size)
static void toStringEveryLineImpl(const StackTrace::Frames & frames, size_t offset, size_t size, std::function<void(const std::string &)> callback)
{
if (size == 0)
return "<Empty trace>";
return callback("<Empty trace>");
const DB::SymbolIndex & symbol_index = DB::SymbolIndex::instance();
std::unordered_map<std::string, DB::Dwarf> dwarfs;
@ -281,12 +287,23 @@ static std::string toStringImpl(const StackTrace::Frames & frames, size_t offset
else
out << "?";
out << "\n";
callback(out.str());
out.str({});
}
}
static std::string toStringImpl(const StackTrace::Frames & frames, size_t offset, size_t size)
{
std::stringstream out;
toStringEveryLineImpl(frames, offset, size, [&](const std::string & str) { out << str << '\n'; });
return out.str();
}
void StackTrace::toStringEveryLine(std::function<void(const std::string &)> callback) const
{
toStringEveryLineImpl(frames, offset, size, std::move(callback));
}
std::string StackTrace::toString() const
{
/// Calculation of stack trace text is extremely slow.

View File

@ -4,6 +4,7 @@
#include <vector>
#include <array>
#include <optional>
#include <functional>
#include <signal.h>
#ifdef __APPLE__
@ -39,6 +40,8 @@ public:
const Frames & getFrames() const;
std::string toString() const;
void toStringEveryLine(std::function<void(const std::string &)> callback) const;
protected:
void tryCapture();
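A sketch of how the new line-by-line API might be used, assuming ClickHouse's Common/StackTrace.h (where construction captures the current stack):

    #include <Common/StackTrace.h>
    #include <iostream>

    int main()
    {
        StackTrace trace; // captures the current stack on construction
        // One callback invocation per frame, e.g. to feed a logger line by line
        // instead of building the whole multi-line string first.
        trace.toStringEveryLine([](const std::string & line) { std::cerr << line; });
    }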

View File

@ -36,7 +36,7 @@ target_include_directories (simple_cache PRIVATE ${DBMS_INCLUDE_DIR})
target_link_libraries (simple_cache PRIVATE common)
add_executable (compact_array compact_array.cpp)
target_link_libraries (compact_array PRIVATE clickhouse_common_io ${Boost_FILESYSTEM_LIBRARY})
target_link_libraries (compact_array PRIVATE clickhouse_common_io stdc++fs)
add_executable (radix_sort radix_sort.cpp)
target_link_libraries (radix_sort PRIVATE clickhouse_common_io)

View File

@ -27,7 +27,7 @@
/// For the expansion of gtest macros.
#if defined(__clang__)
#pragma clang diagnostic ignored "-Wdeprecated"
#elif defined (__GNUC__)
#elif defined (__GNUC__) && __GNUC__ >= 9
#pragma GCC diagnostic ignored "-Wdeprecated-copy"
#endif

View File

@ -92,6 +92,7 @@
#endif
/// Check for presence of address sanitizer
#if !defined(ADDRESS_SANITIZER)
#if defined(__has_feature)
#if __has_feature(address_sanitizer)
#define ADDRESS_SANITIZER 1
@ -99,7 +100,9 @@
#elif defined(__SANITIZE_ADDRESS__)
#define ADDRESS_SANITIZER 1
#endif
#endif
#if !defined(THREAD_SANITIZER)
#if defined(__has_feature)
#if __has_feature(thread_sanitizer)
#define THREAD_SANITIZER 1
@ -107,7 +110,9 @@
#elif defined(__SANITIZE_THREAD__)
#define THREAD_SANITIZER 1
#endif
#endif
#if !defined(MEMORY_SANITIZER)
#if defined(__has_feature)
#if __has_feature(memory_sanitizer)
#define MEMORY_SANITIZER 1
@ -115,6 +120,7 @@
#elif defined(__MEMORY_SANITIZER__)
#define MEMORY_SANITIZER 1
#endif
#endif
/// Explicitly allow undefined behaviour for certain functions. Use it as a function attribute.
/// It is useful when the compiler cannot see (and exploit) it, but UBSan can.
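The sanitizer macros defined above are consumed with plain #if checks; for instance, LibraryDictionarySource below drops RTLD_DEEPBIND under ASan. A self-contained sketch of the pattern, reproducing the detection inline so it compiles on its own:

    #include <cstdio>

    // Same detection pattern as above, reproduced for a standalone example.
    #if !defined(ADDRESS_SANITIZER)
        #if defined(__has_feature)
            #if __has_feature(address_sanitizer)
                #define ADDRESS_SANITIZER 1
            #endif
        #elif defined(__SANITIZE_ADDRESS__)
            #define ADDRESS_SANITIZER 1
        #endif
    #endif

    int main()
    {
    #if defined(ADDRESS_SANITIZER)
        std::puts("ASan build detected");
    #else
        std::puts("no ASan");
    #endif
    }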

View File

@ -1,9 +1,17 @@
#pragma once
#include <ext/scope_guard.h>
#include <openssl/pem.h>
#include <openssl/rsa.h>
#include <random>
#include <sstream>
#include <Common/MemoryTracker.h>
#include <Common/OpenSSLHelpers.h>
#include <Common/PODArray.h>
#include <Core/Types.h>
#include <Interpreters/Context.h>
#include <IO/copyData.h>
#include <IO/LimitReadBuffer.h>
#include <IO/ReadBuffer.h>
#include <IO/ReadBufferFromMemory.h>
#include <IO/ReadBufferFromPocoSocket.h>
@ -14,9 +22,7 @@
#include <IO/WriteHelpers.h>
#include <Poco/Net/StreamSocket.h>
#include <Poco/RandomStream.h>
#include <random>
#include <sstream>
#include <IO/LimitReadBuffer.h>
#include <Poco/SHA1Engine.h>
/// Implementation of MySQL wire protocol.
/// Works only on little-endian architecture.
@ -27,6 +33,9 @@ namespace DB
namespace ErrorCodes
{
extern const int UNKNOWN_PACKET_FROM_CLIENT;
extern const int MYSQL_CLIENT_INSUFFICIENT_CAPABILITIES;
extern const int OPENSSL_ERROR;
extern const int UNKNOWN_EXCEPTION;
}
namespace MySQLProtocol
@ -39,11 +48,6 @@ const size_t MYSQL_ERRMSG_SIZE = 512;
const size_t PACKET_HEADER_SIZE = 4;
const size_t SSL_REQUEST_PAYLOAD_SIZE = 32;
namespace Authentication
{
const String Native = "mysql_native_password";
const String SHA256 = "sha256_password"; /// Caching SHA2 plugin is not used because it would be possible to authenticate knowing hash from users.xml.
}
enum CharacterSet
{
@ -149,6 +153,8 @@ private:
uint8_t & sequence_id;
const size_t max_packet_size = MAX_PACKET_LENGTH;
bool has_read_header = false;
// Size of packet which is being read now.
size_t payload_length = 0;
@ -158,8 +164,9 @@ private:
protected:
bool nextImpl() override
{
if (payload_length == 0 || (payload_length == max_packet_size && offset == payload_length))
if (!has_read_header || (payload_length == max_packet_size && offset == payload_length))
{
has_read_header = true;
working_buffer.resize(0);
offset = 0;
payload_length = 0;
@ -171,10 +178,6 @@ protected:
tmp << "Received packet with payload larger than max_packet_size: " << payload_length;
throw ProtocolError(tmp.str(), ErrorCodes::UNKNOWN_PACKET_FROM_CLIENT);
}
else if (payload_length == 0)
{
return false;
}
size_t packet_sequence_id = 0;
in.read(reinterpret_cast<char &>(packet_sequence_id));
@ -185,6 +188,9 @@ protected:
throw ProtocolError(tmp.str(), ErrorCodes::UNKNOWN_PACKET_FROM_CLIENT);
}
sequence_id++;
if (payload_length == 0)
return false;
}
else if (offset == payload_length)
{
@ -208,6 +214,7 @@ class ClientPacket
{
public:
ClientPacket() = default;
ClientPacket(ClientPacket &&) = default;
virtual void read(ReadBuffer & in, uint8_t & sequence_id)
@ -257,6 +264,7 @@ public:
{
return total_left;
}
private:
WriteBuffer & out;
uint8_t & sequence_id;
@ -452,9 +460,6 @@ protected:
buffer.write(static_cast<char>(auth_plugin_data.size()));
writeChar(0x0, 10, buffer);
writeString(auth_plugin_data.substr(AUTH_PLUGIN_DATA_PART_1_LENGTH, auth_plugin_data.size() - AUTH_PLUGIN_DATA_PART_1_LENGTH), buffer);
// A workaround for PHP mysqlnd extension bug which occurs when sha256_password is used as a default authentication plugin.
// Instead of using client response for mysql_native_password plugin, the server will always generate authentication method mismatch
// and switch to sha256_password to simulate that mysql_native_password is used as a default plugin.
writeString(auth_plugin_name, buffer);
writeChar(0x0, 1, buffer);
}
@ -843,5 +848,230 @@ protected:
}
};
namespace Authentication
{
class IPlugin
{
public:
virtual String getName() = 0;
virtual String getAuthPluginData() = 0;
virtual void authenticate(const String & user_name, std::optional<String> auth_response, Context & context, std::shared_ptr<PacketSender> packet_sender, bool is_secure_connection,
const Poco::Net::SocketAddress & address) = 0;
virtual ~IPlugin() = default;
};
/// https://dev.mysql.com/doc/internals/en/secure-password-authentication.html
class Native41 : public IPlugin
{
public:
Native41()
{
scramble.resize(SCRAMBLE_LENGTH + 1, 0);
Poco::RandomInputStream generator;
for (size_t i = 0; i < SCRAMBLE_LENGTH; i++)
generator >> scramble[i];
}
String getName() override
{
return "mysql_native_password";
}
String getAuthPluginData() override
{
return scramble;
}
void authenticate(
const String & user_name,
std::optional<String> auth_response,
Context & context,
std::shared_ptr<PacketSender> packet_sender,
bool /* is_secure_connection */,
const Poco::Net::SocketAddress & address) override
{
if (!auth_response)
{
packet_sender->sendPacket(AuthSwitchRequest(getName(), scramble), true);
AuthSwitchResponse response;
packet_sender->receivePacket(response);
auth_response = response.value;
}
if (auth_response->empty())
{
context.setUser(user_name, "", address, "");
return;
}
if (auth_response->size() != Poco::SHA1Engine::DIGEST_SIZE)
throw Exception("Wrong size of auth response. Expected: " + std::to_string(Poco::SHA1Engine::DIGEST_SIZE) + " bytes, received: " + std::to_string(auth_response->size()) + " bytes.",
ErrorCodes::UNKNOWN_EXCEPTION);
auto user = context.getUser(user_name);
if (user->password_double_sha1_hex.empty())
throw Exception("Cannot use " + getName() + " auth plugin for user " + user_name + " since its password isn't specified using double SHA1.", ErrorCodes::UNKNOWN_EXCEPTION);
Poco::SHA1Engine::Digest double_sha1_value = Poco::DigestEngine::digestFromHex(user->password_double_sha1_hex);
assert(double_sha1_value.size() == Poco::SHA1Engine::DIGEST_SIZE);
Poco::SHA1Engine engine;
engine.update(scramble.data(), SCRAMBLE_LENGTH);
engine.update(double_sha1_value.data(), double_sha1_value.size());
String password_sha1(Poco::SHA1Engine::DIGEST_SIZE, 0x0);
const Poco::SHA1Engine::Digest & digest = engine.digest();
for (size_t i = 0; i < password_sha1.size(); i++)
{
password_sha1[i] = digest[i] ^ static_cast<unsigned char>((*auth_response)[i]);
}
context.setUser(user_name, password_sha1, address, "");
}
private:
String scramble;
};
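Condensed, the Native41 exchange works like this: the client sends response = SHA1(password) XOR SHA1(scramble ++ SHA1(SHA1(password))). Because the server stores SHA1(SHA1(password)), it can rebuild the same pad and XOR it with the response to recover SHA1(password), exactly as authenticate() does above. A standalone sketch of that unmasking step (illustrative; assumes auth_response is DIGEST_SIZE bytes):

    #include <Poco/SHA1Engine.h>
    #include <string>

    std::string unmaskNative41(const std::string & scramble20,               // SCRAMBLE_LENGTH bytes
                               const Poco::SHA1Engine::Digest & double_sha1, // stored SHA1(SHA1(password))
                               const std::string & auth_response)            // client response, 20 bytes
    {
        Poco::SHA1Engine engine;
        engine.update(scramble20.data(), scramble20.size());
        engine.update(double_sha1.data(), double_sha1.size());
        const Poco::SHA1Engine::Digest & pad = engine.digest();

        std::string password_sha1(pad.size(), 0);
        for (size_t i = 0; i < password_sha1.size(); ++i)
            password_sha1[i] = pad[i] ^ static_cast<unsigned char>(auth_response[i]);
        // Passed to context.setUser above; ClickHouse checks it against the stored double SHA1.
        return password_sha1;
    }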
/// Caching SHA2 plugin is not used because it would be possible to authenticate knowing hash from users.xml.
/// https://dev.mysql.com/doc/internals/en/sha256.html
class Sha256Password : public IPlugin
{
public:
Sha256Password(RSA & public_key_, RSA & private_key_, Logger * log_)
: public_key(public_key_)
, private_key(private_key_)
, log(log_)
{
/** Native authentication sends 20 bytes + a '\0' character = 21 bytes.
* This plugin must do the same to stay consistent with historical behavior if it is set to operate as a default plugin. [1]
* https://github.com/mysql/mysql-server/blob/8.0/sql/auth/sql_authentication.cc#L3994
*/
scramble.resize(SCRAMBLE_LENGTH + 1, 0);
Poco::RandomInputStream generator;
for (size_t i = 0; i < SCRAMBLE_LENGTH; i++)
generator >> scramble[i];
}
String getName() override
{
return "sha256_password";
}
String getAuthPluginData() override
{
return scramble;
}
void authenticate(
const String & user_name,
std::optional<String> auth_response,
Context & context,
std::shared_ptr<PacketSender> packet_sender,
bool is_secure_connection,
const Poco::Net::SocketAddress & address) override
{
if (!auth_response)
{
packet_sender->sendPacket(AuthSwitchRequest(getName(), scramble), true);
if (packet_sender->in->eof())
throw Exception("Client doesn't support authentication method " + getName() + " used by ClickHouse. Specifying user password using 'password_double_sha1_hex' may fix the problem.",
ErrorCodes::MYSQL_CLIENT_INSUFFICIENT_CAPABILITIES);
AuthSwitchResponse response;
packet_sender->receivePacket(response);
auth_response = response.value;
LOG_TRACE(log, "Authentication method mismatch.");
}
else
{
LOG_TRACE(log, "Authentication method match.");
}
if (auth_response == "\1")
{
LOG_TRACE(log, "Client requests public key.");
BIO * mem = BIO_new(BIO_s_mem());
SCOPE_EXIT(BIO_free(mem));
if (PEM_write_bio_RSA_PUBKEY(mem, &public_key) != 1)
{
throw Exception("Failed to write public key to memory. Error: " + getOpenSSLErrors(), ErrorCodes::OPENSSL_ERROR);
}
char * pem_buf = nullptr;
long pem_size = BIO_get_mem_data(mem, &pem_buf);
String pem(pem_buf, pem_size);
LOG_TRACE(log, "Key: " << pem);
AuthMoreData data(pem);
packet_sender->sendPacket(data, true);
AuthSwitchResponse response;
packet_sender->receivePacket(response);
auth_response = response.value;
}
else
{
LOG_TRACE(log, "Client didn't request public key.");
}
String password;
/** Decrypt password, if it's not empty.
* The original intention was that the password is a string[NUL] but this never got enforced properly so now we have to accept that
* an empty packet is a blank password, thus the check for auth_response.empty() has to be made too.
* https://github.com/mysql/mysql-server/blob/8.0/sql/auth/sql_authentication.cc#L4017
*/
if (!is_secure_connection && !auth_response->empty() && auth_response != String("\0", 1))
{
LOG_TRACE(log, "Received nonempty password");
auto ciphertext = reinterpret_cast<unsigned char *>(auth_response->data());
unsigned char plaintext[RSA_size(&private_key)];
int plaintext_size = RSA_private_decrypt(auth_response->size(), ciphertext, plaintext, &private_key, RSA_PKCS1_OAEP_PADDING);
if (plaintext_size == -1)
{
throw Exception("Failed to decrypt auth data. Error: " + getOpenSSLErrors(), ErrorCodes::OPENSSL_ERROR);
}
password.resize(plaintext_size);
for (int i = 0; i < plaintext_size; i++)
{
password[i] = plaintext[i] ^ static_cast<unsigned char>(scramble[i % scramble.size()]);
}
}
else if (is_secure_connection)
{
password = *auth_response;
}
else
{
LOG_TRACE(log, "Received empty password");
}
if (!password.empty() && password.back() == 0)
{
password.pop_back();
}
context.setUser(user_name, password, address, "");
}
private:
RSA & public_key;
RSA & private_key;
Logger * log;
String scramble;
};
}
}
}
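For reference, the framing that PacketPayloadReadBuffer above is parsing: each MySQL packet starts with a 4-byte header, a 3-byte little-endian payload length plus a 1-byte sequence id, and a payload of exactly MAX_PACKET_LENGTH (0xFFFFFF) signals that the payload continues in the next packet, which is why the reader loops while payload_length == max_packet_size. A minimal standalone sketch of the header layout:

    #include <cstdint>
    #include <cstdio>

    // Encode a MySQL wire-protocol packet header: 3-byte little-endian payload
    // length, then a 1-byte sequence id.
    void writePacketHeader(uint8_t out[4], uint32_t payload_length, uint8_t sequence_id)
    {
        out[0] = payload_length & 0xFF;
        out[1] = (payload_length >> 8) & 0xFF;
        out[2] = (payload_length >> 16) & 0xFF;
        out[3] = sequence_id;
    }

    int main()
    {
        uint8_t header[4];
        writePacketHeader(header, 5, 0); // e.g. a 5-byte payload, first packet
        std::printf("%02x %02x %02x %02x\n", header[0], header[1], header[2], header[3]);

        writePacketHeader(header, 0xFFFFFF, 1); // max-size payload: "more packets follow"
        std::printf("%02x %02x %02x %02x\n", header[0], header[1], header[2], header[3]);
    }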

View File

@ -586,7 +586,7 @@ public:
for (const auto & member : members())
{
if (member.isChanged(castToDerived()))
found_changes.emplace_back(member.name.toString(), member.get_field(castToDerived()));
found_changes.push_back({member.name.toString(), member.get_field(castToDerived())});
}
return found_changes;
}

View File

@ -73,6 +73,15 @@ public:
Block getHeader() const override { return children.at(0)->getHeader(); }
void cancel(bool kill) override
{
IBlockInputStream::cancel(kill);
/// Wait for background calculations to finish, to be sure
/// that nothing is still executing after the end of the stream.
if (started)
pool.wait();
}
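The reasoning behind waiting in cancel(): if a background read is still running when the stream is destroyed, it would touch freed state. A minimal sketch of the cancel-then-wait pattern, with std::thread standing in for ClickHouse's ThreadPool (names here are illustrative):

    #include <atomic>
    #include <chrono>
    #include <thread>

    struct AsyncReader
    {
        std::atomic<bool> cancelled{false};
        std::thread worker;

        void start()
        {
            worker = std::thread([this]
            {
                while (!cancelled.load())
                    std::this_thread::sleep_for(std::chrono::milliseconds(10)); // "read next block"
            });
        }

        void cancel()
        {
            cancelled.store(true);
            if (worker.joinable())
                worker.join(); // like pool.wait(): afterwards nothing runs in the background
        }
    };

    int main()
    {
        AsyncReader reader;
        reader.start();
        reader.cancel(); // safe to destroy reader's state after this returns
    }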
~AsynchronousBlockInputStream() override
{

View File

@ -2,7 +2,7 @@
#include <Poco/Logger.h>
#include <DataStreams/IBlockInputStream.h>
#include <Interpreters/ExpressionAnalyzer.h> /// SubqueriesForSets
#include <Interpreters/SubqueryForSet.h>
namespace Poco { class Logger; }

View File

@ -102,8 +102,6 @@ Block FinishSortingBlockInputStream::readImpl()
if (block.rows() == 0)
continue;
// We need to sort each block separately before merging.
sortBlock(block, description_to_sort, limit);
removeConstantsFromBlock(block);

View File

@ -39,7 +39,7 @@ try
NamesAndTypesList source_columns = {{"number", std::make_shared<DataTypeUInt64>()}};
auto syntax_result = SyntaxAnalyzer(context, {}).analyze(ast, source_columns);
ExpressionAnalyzer analyzer(ast, syntax_result, context);
SelectQueryExpressionAnalyzer analyzer(ast, syntax_result, context);
ExpressionActionsChain chain(context);
analyzer.appendSelect(chain, false);
analyzer.appendProjectResult(chain);

View File

@ -44,7 +44,7 @@ try
NamesAndTypesList source_columns = {{"number", std::make_shared<DataTypeUInt64>()}};
auto syntax_result = SyntaxAnalyzer(context, {}).analyze(ast, source_columns);
ExpressionAnalyzer analyzer(ast, syntax_result, context);
SelectQueryExpressionAnalyzer analyzer(ast, syntax_result, context);
ExpressionActionsChain chain(context);
analyzer.appendSelect(chain, false);
analyzer.appendProjectResult(chain);

View File

@ -1,5 +1,6 @@
#include "LibraryDictionarySource.h"
#include <DataStreams/OneBlockInputStream.h>
#include <Core/Defines.h>
#include <Interpreters/Context.h>
#include <Poco/File.h>
#include <common/logger_useful.h>
@ -134,7 +135,7 @@ LibraryDictionarySource::LibraryDictionarySource(
ErrorCodes::FILE_DOESNT_EXIST);
description.init(sample_block);
library = std::make_shared<SharedLibrary>(path, RTLD_LAZY
#if defined(RTLD_DEEPBIND) // Does not exists in freebsd
#if defined(RTLD_DEEPBIND) && !defined(ADDRESS_SANITIZER) // Does not exist in FreeBSD. Does not work with Address Sanitizer.
| RTLD_DEEPBIND
#endif
);

View File

@ -83,7 +83,17 @@ BlockInputStreamPtr FormatFactory::getInput(
return std::make_shared<NativeBlockInputStream>(buf, sample, 0);
if (!getCreators(name).input_processor_creator)
return getInput(name, buf, sample, context, max_block_size, rows_portion_size, std::move(callback));
{
const auto & input_getter = getCreators(name).input_creator;
if (!input_getter)
throw Exception("Format " + name + " is not suitable for input", ErrorCodes::FORMAT_IS_NOT_SUITABLE_FOR_INPUT);
const Settings & settings = context.getSettingsRef();
FormatSettings format_settings = getInputFormatSetting(settings);
return input_getter(
buf, sample, context, max_block_size, rows_portion_size, callback ? callback : ReadCallback(), format_settings);
}
auto format = getInputFormat(name, buf, sample, context, max_block_size, rows_portion_size, std::move(callback));
return std::make_shared<InputStreamFromInputFormat>(std::move(format));
@ -106,13 +116,22 @@ BlockOutputStreamPtr FormatFactory::getOutput(const String & name, WriteBuffer &
}
if (!getCreators(name).output_processor_creator)
return getOutput(name, buf, sample, context);
{
const auto & output_getter = getCreators(name).output_creator;
if (!output_getter)
throw Exception("Format " + name + " is not suitable for output", ErrorCodes::FORMAT_IS_NOT_SUITABLE_FOR_OUTPUT);
const Settings & settings = context.getSettingsRef();
FormatSettings format_settings = getOutputFormatSetting(settings);
/** Materialization is needed, because formats can use the functions of `IDataType`,
* which only work with full columns.
*/
return std::make_shared<MaterializingBlockOutputStream>(
output_getter(buf, sample, context, format_settings), sample);
}
auto format = getOutputFormat(name, buf, sample, context);
/** Materialization is needed, because formats can use the functions of `IDataType`,
* which only work with full columns.
*/
return std::make_shared<MaterializingBlockOutputStream>(std::make_shared<OutputStreamToOutputFormat>(format), sample);
}

View File

@ -25,6 +25,7 @@ target_link_libraries(clickhouse_functions
PRIVATE
${ZLIB_LIBRARIES}
${Boost_FILESYSTEM_LIBRARY}
${CMAKE_DL_LIBS}
)
if (OPENSSL_CRYPTO_LIBRARY)

View File

@ -7,6 +7,7 @@
#include "config_functions.h"
#include <Common/CpuId.h>
#include <Common/typeid_cast.h>
#include <Core/AccurateComparison.h>
#include <Core/Settings.h>
#include <Columns/ColumnConst.h>
#include <Columns/ColumnString.h>
@ -15,7 +16,6 @@
#include <Columns/ColumnNullable.h>
#include <Columns/ColumnArray.h>
#include <Columns/ColumnTuple.h>
#include <Core/AccurateComparison.h>
#include <DataTypes/DataTypesNumber.h>
#include <DataTypes/DataTypeString.h>
#include <DataTypes/DataTypeEnum.h>
@ -64,7 +64,7 @@ public:
{
/// Choose JSONParser.
#if USE_SIMDJSON
if (context.getSettings().allow_simdjson && Cpu::CpuFlagsCache::have_AVX2)
if (context.getSettings().allow_simdjson && Cpu::CpuFlagsCache::have_SSE42 && Cpu::CpuFlagsCache::have_PCLMUL)
{
Executor<SimdJSONParser>::run(block, arguments, result_pos, input_rows_count);
return;

View File

@ -4,6 +4,10 @@
namespace DB
{
namespace ErrorCodes
{
extern const int BAD_CAST;
}
/// Working with UInt8: last bit = can be true, previous = can be false (Like dbms/src/Storages/MergeTree/BoolMask.h).
/// This function provides "AND" operation for BoolMasks.
@ -17,6 +21,8 @@ namespace DB
template <typename Result = ResultType>
static inline Result apply(A left, B right)
{
if constexpr (!std::is_same_v<A, ResultType> || !std::is_same_v<B, ResultType>)
throw DB::Exception("It's a bug! Only UInt8 type is supported by __bitBoolMaskAnd.", ErrorCodes::BAD_CAST);
return static_cast<ResultType>(
((static_cast<ResultType>(left) & static_cast<ResultType>(right)) & 1)
| ((((static_cast<ResultType>(left) >> 1) | (static_cast<ResultType>(right) >> 1)) & 1) << 1));
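A worked example of the two-bit encoding may help: bit 0 means "can be true", bit 1 means "can be false", so 0b01 is definitely true, 0b10 definitely false, 0b11 unknown. A standalone sketch of the AND combination above:

    #include <cstdint>
    #include <cstdio>

    // Same formula as __bitBoolMaskAnd: the result can be true only if both sides
    // can be true; it can be false if either side can be false.
    static uint8_t maskAnd(uint8_t l, uint8_t r)
    {
        return static_cast<uint8_t>(((l & r) & 1) | ((((l >> 1) | (r >> 1)) & 1) << 1));
    }

    int main()
    {
        std::printf("%d\n", maskAnd(0b01, 0b01)); // 1: true AND true is true
        std::printf("%d\n", maskAnd(0b01, 0b10)); // 2: true AND false is false
        std::printf("%d\n", maskAnd(0b11, 0b01)); // 3: unknown AND true can be either
    }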

View File

@ -4,6 +4,10 @@
namespace DB
{
namespace ErrorCodes
{
extern const int BAD_CAST;
}
/// Working with UInt8: last bit = can be true, previous = can be false (Like dbms/src/Storages/MergeTree/BoolMask.h).
/// This function provides "OR" operation for BoolMasks.
@ -17,6 +21,8 @@ namespace DB
template <typename Result = ResultType>
static inline Result apply(A left, B right)
{
if constexpr (!std::is_same_v<A, ResultType> || !std::is_same_v<B, ResultType>)
throw DB::Exception("It's a bug! Only UInt8 type is supported by __bitBoolMaskOr.", ErrorCodes::BAD_CAST);
return static_cast<ResultType>(
((static_cast<ResultType>(left) | static_cast<ResultType>(right)) & 1)
| ((((static_cast<ResultType>(left) >> 1) & (static_cast<ResultType>(right) >> 1)) & 1) << 1));

View File

@ -4,6 +4,10 @@
namespace DB
{
namespace ErrorCodes
{
extern const int BAD_CAST;
}
/// Working with UInt8: last bit = can be true, previous = can be false (Like dbms/src/Storages/MergeTree/BoolMask.h).
/// This function provides "NOT" operation for BoolMasks by swapping last two bits ("can be true" <-> "can be false").
@ -14,6 +18,8 @@ namespace DB
static inline ResultType NO_SANITIZE_UNDEFINED apply(A a)
{
if constexpr (!std::is_same_v<A, ResultType>)
throw DB::Exception("It's a bug! Only UInt8 type is supported by __bitSwapLastTwo.", ErrorCodes::BAD_CAST);
return static_cast<ResultType>(
((static_cast<ResultType>(a) & 1) << 1) | ((static_cast<ResultType>(a) >> 1) & 1));
}

View File

@ -4,6 +4,10 @@
namespace DB
{
namespace ErrorCodes
{
extern const int BAD_CAST;
}
/// Working with UInt8: last bit = can be true, previous = can be false (Like dbms/src/Storages/MergeTree/BoolMask.h).
/// This function wraps bool atomic functions
@ -15,7 +19,9 @@ namespace DB
static inline ResultType NO_SANITIZE_UNDEFINED apply(A a)
{
return a == static_cast<UInt8>(0) ? static_cast<ResultType>(0b10) : static_cast<ResultType >(0b1);
if constexpr (!std::is_integral_v<A>)
throw DB::Exception("It's a bug! Only integer types are supported by __bitWrapperFunc.", ErrorCodes::BAD_CAST);
return a == 0 ? static_cast<ResultType>(0b10) : static_cast<ResultType >(0b1);
}
#if USE_EMBEDDED_COMPILER

View File

@ -0,0 +1,54 @@
#include <Functions/IFunction.h>
#include <Functions/FunctionFactory.h>
#include <Interpreters/Context.h>
#include <DataTypes/DataTypeString.h>
namespace DB
{
class FunctionCurrentUser : public IFunction
{
const String user_name;
public:
static constexpr auto name = "currentUser";
static FunctionPtr create(const Context & context)
{
return std::make_shared<FunctionCurrentUser>(context.getClientInfo().initial_user);
}
explicit FunctionCurrentUser(const String & user_name_) : user_name{user_name_}
{
}
String getName() const override
{
return name;
}
size_t getNumberOfArguments() const override
{
return 0;
}
DataTypePtr getReturnTypeImpl(const DataTypes & /*arguments*/) const override
{
return std::make_shared<DataTypeString>();
}
bool isDeterministic() const override { return false; }
void executeImpl(Block & block, const ColumnNumbers &, size_t result, size_t input_rows_count) override
{
block.getByPosition(result).column = DataTypeString().createColumnConst(input_rows_count, user_name);
}
};
void registerFunctionCurrentUser(FunctionFactory & factory)
{
factory.registerFunction<FunctionCurrentUser>();
factory.registerAlias("user", FunctionCurrentUser::name, FunctionFactory::CaseInsensitive);
}
}

View File

@ -6,6 +6,7 @@ namespace DB
class FunctionFactory;
void registerFunctionCurrentDatabase(FunctionFactory &);
void registerFunctionCurrentUser(FunctionFactory &);
void registerFunctionHostName(FunctionFactory &);
void registerFunctionVisibleWidth(FunctionFactory &);
void registerFunctionToTypeName(FunctionFactory &);
@ -56,6 +57,7 @@ void registerFunctionConvertCharset(FunctionFactory &);
void registerFunctionsMiscellaneous(FunctionFactory & factory)
{
registerFunctionCurrentDatabase(factory);
registerFunctionCurrentUser(factory);
registerFunctionHostName(factory);
registerFunctionVisibleWidth(factory);
registerFunctionToTypeName(factory);

View File

@ -0,0 +1,29 @@
#include <IO/WriteBufferFromFileDescriptorDiscardOnFailure.h>
namespace ProfileEvents
{
extern const Event CannotWriteToWriteBufferDiscard;
}
namespace DB
{
void WriteBufferFromFileDescriptorDiscardOnFailure::nextImpl()
{
size_t bytes_written = 0;
while (bytes_written != offset())
{
ssize_t res = ::write(fd, working_buffer.begin() + bytes_written, offset() - bytes_written);
if ((-1 == res || 0 == res) && errno != EINTR)
{
ProfileEvents::increment(ProfileEvents::CannotWriteToWriteBufferDiscard);
break; /// Discard
}
if (res > 0)
bytes_written += res;
}
}
}

View File

@ -0,0 +1,23 @@
#pragma once
#include <IO/WriteBufferFromFileDescriptor.h>
namespace DB
{
/** Write to a file descriptor, but drop the data if the write would block or fail.
* For use within a signal handler. Motivating example: a signal handler invoked during execution of malloc
* should not block because some mutex (or even worse - a spinlock) may be held.
*/
class WriteBufferFromFileDescriptorDiscardOnFailure : public WriteBufferFromFileDescriptor
{
protected:
void nextImpl() override;
public:
using WriteBufferFromFileDescriptor::WriteBufferFromFileDescriptor;
~WriteBufferFromFileDescriptorDiscardOnFailure() override {}
};
}
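A sketch of the intended call pattern, mirroring the QueryProfiler site above (fixed stack buffer, pipe write end; assumes the ClickHouse headers):

    #include <IO/WriteBufferFromFileDescriptorDiscardOnFailure.h>
    #include <IO/WriteHelpers.h>

    void writeFromSignalHandler(int pipe_write_fd, int signal_number)
    {
        // Fixed-size stack buffer: no allocation inside the signal handler.
        constexpr size_t buf_size = 64;
        char buffer[buf_size];
        DB::WriteBufferFromFileDescriptorDiscardOnFailure out(pipe_write_fd, buf_size, buffer);
        DB::writeIntBinary(signal_number, out);
        out.next(); // if the pipe is full, the bytes are dropped instead of blocking
    }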

View File

@ -59,10 +59,10 @@ target_link_libraries (write_int PRIVATE clickhouse_common_io)
if (OS_LINUX OR OS_FREEBSD)
add_executable(write_buffer_aio write_buffer_aio.cpp)
target_link_libraries (write_buffer_aio PRIVATE clickhouse_common_io ${Boost_FILESYSTEM_LIBRARY})
target_link_libraries (write_buffer_aio PRIVATE clickhouse_common_io stdc++fs)
add_executable(read_buffer_aio read_buffer_aio.cpp)
target_link_libraries (read_buffer_aio PRIVATE clickhouse_common_io ${Boost_FILESYSTEM_LIBRARY})
target_link_libraries (read_buffer_aio PRIVATE clickhouse_common_io stdc++fs)
endif ()
add_executable (zlib_buffers zlib_buffers.cpp)

View File

@ -1,3 +1,5 @@
#include <Common/typeid_cast.h>
#include <Functions/FunctionFactory.h>
#include <Functions/FunctionsMiscellaneous.h>
@ -19,8 +21,6 @@
#include <Storages/StorageSet.h>
#include <Parsers/ASTFunction.h>
#include <Common/typeid_cast.h>
#include <Parsers/DumpASTNode.h>
#include <Parsers/ASTIdentifier.h>
#include <Parsers/ASTLiteral.h>
#include <Parsers/ASTSelectQuery.h>
@ -228,346 +228,350 @@ const Block & ScopeStack::getSampleBlock() const
return stack.back().actions->getSampleBlock();
}
ActionsVisitor::ActionsVisitor(
const Context & context_, SizeLimits set_size_limit_, size_t subquery_depth_,
const NamesAndTypesList & source_columns_, const ExpressionActionsPtr & actions,
PreparedSets & prepared_sets_, SubqueriesForSets & subqueries_for_sets_,
bool no_subqueries_, bool only_consts_, bool no_storage_or_local_, std::ostream * ostr_)
: context(context_),
set_size_limit(set_size_limit_),
subquery_depth(subquery_depth_),
source_columns(source_columns_),
prepared_sets(prepared_sets_),
subqueries_for_sets(subqueries_for_sets_),
no_subqueries(no_subqueries_),
only_consts(only_consts_),
no_storage_or_local(no_storage_or_local_),
visit_depth(0),
ostr(ostr_),
actions_stack(actions, context)
struct CachedColumnName
{
String cached;
const String & get(const ASTPtr & ast)
{
if (cached.empty())
cached = ast->getColumnName();
return cached;
}
};
bool ActionsMatcher::needChildVisit(const ASTPtr & node, const ASTPtr & child)
{
/// These node types visit their children themselves.
if (node->as<ASTIdentifier>() ||
node->as<ASTFunction>() ||
node->as<ASTLiteral>())
return false;
/// Do not go to FROM, JOIN, UNION.
if (child->as<ASTTableExpression>() ||
child->as<ASTSelectQuery>())
return false;
return true;
}
void ActionsVisitor::visit(const ASTPtr & ast)
void ActionsMatcher::visit(const ASTPtr & ast, Data & data)
{
DumpASTNode dump(*ast, ostr, visit_depth, "getActions");
if (const auto * identifier = ast->as<ASTIdentifier>())
visit(*identifier, ast, data);
else if (const auto * node = ast->as<ASTFunction>())
visit(*node, ast, data);
else if (const auto * literal = ast->as<ASTLiteral>())
visit(*literal, ast, data);
}
String ast_column_name;
auto getColumnName = [&ast, &ast_column_name]()
{
if (ast_column_name.empty())
ast_column_name = ast->getColumnName();
return ast_column_name;
};
/// If the result of the calculation already exists in the block.
if ((ast->as<ASTFunction>() || ast->as<ASTLiteral>()) && actions_stack.getSampleBlock().has(getColumnName()))
void ActionsMatcher::visit(const ASTIdentifier & identifier, const ASTPtr & ast, Data & data)
{
CachedColumnName column_name;
if (data.hasColumn(column_name.get(ast)))
return;
if (const auto * identifier = ast->as<ASTIdentifier>())
if (!data.only_consts)
{
if (!only_consts && !actions_stack.getSampleBlock().has(getColumnName()))
{
/// The requested column is not in the block.
/// If such a column exists in the table, then the user probably forgot to surround it with an aggregate function or add it to GROUP BY.
/// The requested column is not in the block.
/// If such a column exists in the table, then the user probably forgot to surround it with an aggregate function or add it to GROUP BY.
bool found = false;
for (const auto & column_name_type : source_columns)
if (column_name_type.name == getColumnName())
found = true;
bool found = false;
for (const auto & column_name_type : data.source_columns)
if (column_name_type.name == column_name.get(ast))
found = true;
if (found)
throw Exception("Column " + getColumnName() + " is not under aggregate function and not in GROUP BY.",
ErrorCodes::NOT_AN_AGGREGATE);
if (found)
throw Exception("Column " + column_name.get(ast) + " is not under aggregate function and not in GROUP BY.",
ErrorCodes::NOT_AN_AGGREGATE);
/// Special check for WITH statement alias. Add alias action to be able to use this alias.
if (identifier->prefer_alias_to_column_name && !identifier->alias.empty())
actions_stack.addAction(ExpressionAction::addAliases({{identifier->name, identifier->alias}}));
}
/// Special check for WITH statement alias. Add alias action to be able to use this alias.
if (identifier.prefer_alias_to_column_name && !identifier.alias.empty())
data.addAction(ExpressionAction::addAliases({{identifier.name, identifier.alias}}));
}
else if (const auto * node = ast->as<ASTFunction>())
}
void ActionsMatcher::visit(const ASTFunction & node, const ASTPtr & ast, Data & data)
{
CachedColumnName column_name;
if (data.hasColumn(column_name.get(ast)))
return;
if (node.name == "lambda")
throw Exception("Unexpected lambda expression", ErrorCodes::UNEXPECTED_EXPRESSION);
/// Function arrayJoin.
if (node.name == "arrayJoin")
{
if (node->name == "lambda")
throw Exception("Unexpected lambda expression", ErrorCodes::UNEXPECTED_EXPRESSION);
if (node.arguments->children.size() != 1)
throw Exception("arrayJoin requires exactly 1 argument", ErrorCodes::TYPE_MISMATCH);
/// Function arrayJoin.
if (node->name == "arrayJoin")
ASTPtr arg = node.arguments->children.at(0);
visit(arg, data);
if (!data.only_consts)
{
if (node->arguments->children.size() != 1)
throw Exception("arrayJoin requires exactly 1 argument", ErrorCodes::TYPE_MISMATCH);
String result_name = column_name.get(ast);
data.addAction(ExpressionAction::copyColumn(arg->getColumnName(), result_name));
NameSet joined_columns;
joined_columns.insert(result_name);
data.addAction(ExpressionAction::arrayJoin(joined_columns, false, data.context));
}
ASTPtr arg = node->arguments->children.at(0);
visit(arg);
if (!only_consts)
return;
}
SetPtr prepared_set;
if (functionIsInOrGlobalInOperator(node.name))
{
/// Let's find the type of the first argument (then getActionsImpl will be called again and will not affect anything).
visit(node.arguments->children.at(0), data);
if (!data.no_subqueries)
{
/// Transform tuple or subquery into a set.
prepared_set = makeSet(node, data);
}
else
{
if (!data.only_consts)
{
String result_name = getColumnName();
actions_stack.addAction(ExpressionAction::copyColumn(arg->getColumnName(), result_name));
NameSet joined_columns;
joined_columns.insert(result_name);
actions_stack.addAction(ExpressionAction::arrayJoin(joined_columns, false, context));
}
/// We are in a part of the tree that we are not going to compute. We only need to define types.
/// Do not evaluate subqueries or create sets. We treat "IN" as the "ignoreExceptNull" function.
data.addAction(ExpressionAction::applyFunction(
FunctionFactory::instance().get("ignoreExceptNull", data.context),
{ node.arguments->children.at(0)->getColumnName() },
column_name.get(ast)));
}
return;
}
}
SetPtr prepared_set;
if (functionIsInOrGlobalInOperator(node->name))
/// A special function `indexHint`. Everything that is inside it is not calculated
/// (and is used only for index analysis, see KeyCondition).
if (node.name == "indexHint")
{
data.addAction(ExpressionAction::addColumn(ColumnWithTypeAndName(
ColumnConst::create(ColumnUInt8::create(1, 1), 1), std::make_shared<DataTypeUInt8>(),
column_name.get(ast))));
return;
}
if (AggregateFunctionFactory::instance().isAggregateFunctionName(node.name))
return;
/// Context object that we pass to function should live during query.
const Context & function_context = data.context.hasQueryContext()
? data.context.getQueryContext()
: data.context;
FunctionBuilderPtr function_builder;
try
{
function_builder = FunctionFactory::instance().get(node.name, function_context);
}
catch (DB::Exception & e)
{
auto hints = AggregateFunctionFactory::instance().getHints(node.name);
if (!hints.empty())
e.addMessage("Or unknown aggregate function " + node.name + ". Maybe you meant: " + toString(hints));
e.rethrow();
}
Names argument_names;
DataTypes argument_types;
bool arguments_present = true;
/// If the function has an argument-lambda expression, you need to determine its type before the recursive call.
bool has_lambda_arguments = false;
for (size_t arg = 0; arg < node.arguments->children.size(); ++arg)
{
auto & child = node.arguments->children[arg];
auto child_column_name = child->getColumnName();
const auto * lambda = child->as<ASTFunction>();
if (lambda && lambda->name == "lambda")
{
/// If the argument is a lambda expression, just remember its approximate type.
if (lambda->arguments->children.size() != 2)
throw Exception("lambda requires two arguments", ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
const auto * lambda_args_tuple = lambda->arguments->children.at(0)->as<ASTFunction>();
if (!lambda_args_tuple || lambda_args_tuple->name != "tuple")
throw Exception("First argument of lambda must be a tuple", ErrorCodes::TYPE_MISMATCH);
has_lambda_arguments = true;
argument_types.emplace_back(std::make_shared<DataTypeFunction>(DataTypes(lambda_args_tuple->arguments->children.size())));
/// Select the name in the next cycle.
argument_names.emplace_back();
}
else if (functionIsInOrGlobalInOperator(node.name) && arg == 1 && prepared_set)
{
ColumnWithTypeAndName column;
column.type = std::make_shared<DataTypeSet>();
/// If the argument is a set given by an enumeration of values (so, the set was already built), give it a unique name,
/// so that sets with the same literal representation do not fuse together (they can have different types).
if (!prepared_set->empty())
column.name = getUniqueName(data.getSampleBlock(), "__set");
else
column.name = child_column_name;
if (!data.hasColumn(column.name))
{
column.column = ColumnSet::create(1, prepared_set);
data.addAction(ExpressionAction::addColumn(column));
}
argument_types.push_back(column.type);
argument_names.push_back(column.name);
}
else
{
/// If the argument is not a lambda expression, call it recursively and find out its type.
visit(child, data);
std::string name = child_column_name;
if (data.hasColumn(name))
{
argument_types.push_back(data.getSampleBlock().getByName(name).type);
argument_names.push_back(name);
}
else
{
if (data.only_consts)
arguments_present = false;
else
throw Exception("Unknown identifier: " + name, ErrorCodes::UNKNOWN_IDENTIFIER);
}
}
}
if (data.only_consts && !arguments_present)
return;
if (has_lambda_arguments && !data.only_consts)
{
function_builder->getLambdaArgumentTypes(argument_types);
/// Call recursively for lambda expressions.
for (size_t i = 0; i < node.arguments->children.size(); ++i)
{
ASTPtr child = node.arguments->children[i];
const auto * lambda = child->as<ASTFunction>();
if (lambda && lambda->name == "lambda")
{
const DataTypeFunction * lambda_type = typeid_cast<const DataTypeFunction *>(argument_types[i].get());
const auto * lambda_args_tuple = lambda->arguments->children.at(0)->as<ASTFunction>();
const ASTs & lambda_arg_asts = lambda_args_tuple->arguments->children;
NamesAndTypesList lambda_arguments;
for (size_t j = 0; j < lambda_arg_asts.size(); ++j)
{
auto opt_arg_name = tryGetIdentifierName(lambda_arg_asts[j]);
if (!opt_arg_name)
throw Exception("lambda argument declarations must be identifiers", ErrorCodes::TYPE_MISMATCH);
lambda_arguments.emplace_back(*opt_arg_name, lambda_type->getArgumentTypes()[j]);
}
data.actions_stack.pushLevel(lambda_arguments);
visit(lambda->arguments->children.at(1), data);
ExpressionActionsPtr lambda_actions = data.actions_stack.popLevel();
String result_name = lambda->arguments->children.at(1)->getColumnName();
lambda_actions->finalize(Names(1, result_name));
DataTypePtr result_type = lambda_actions->getSampleBlock().getByName(result_name).type;
Names captured;
Names required = lambda_actions->getRequiredColumns();
for (const auto & required_arg : required)
if (findColumn(required_arg, lambda_arguments) == lambda_arguments.end())
captured.push_back(required_arg);
/// We cannot use getColumnName() as the name here,
/// because it does not uniquely define the expression (the types of arguments can be different).
String lambda_name = getUniqueName(data.getSampleBlock(), "__lambda");
auto function_capture = std::make_shared<FunctionCapture>(
lambda_actions, captured, lambda_arguments, result_type, result_name);
data.addAction(ExpressionAction::applyFunction(function_capture, captured, lambda_name));
argument_types[i] = std::make_shared<DataTypeFunction>(lambda_type->getArgumentTypes(), result_type);
argument_names[i] = lambda_name;
}
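/// Editor's note (illustrative): for arrayMap(x -> x + 1, arr) the lambda body is built on its own
/// ScopeStack level; any outer-scope columns it reads become "captured", and the closure is added
/// to the block as a __lambda column through FunctionCapture before the enclosing function is applied.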
}
}
if (data.only_consts)
{
for (const auto & argument_name : argument_names)
{
if (!data.hasColumn(argument_name))
{
arguments_present = false;
break;
}
}
}
if (arguments_present)
{
data.addAction(ExpressionAction::applyFunction(function_builder, argument_names, column_name.get(ast)));
}
}
void ActionsMatcher::visit(const ASTLiteral & literal, const ASTPtr & ast, Data & data)
{
CachedColumnName column_name;
if (data.hasColumn(column_name.get(ast)))
return;
DataTypePtr type = applyVisitor(FieldToDataType(), literal.value);
ColumnWithTypeAndName column;
column.column = type->createColumnConst(1, convertFieldToType(literal.value, *type));
column.type = type;
column.name = column_name.get(ast);
data.addAction(ExpressionAction::addColumn(column));
}
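/// Editor's note (illustrative): a literal such as 42 is materialised as a single-value constant
/// column (here UInt8, as deduced by FieldToDataType) registered under the literal's column name.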
SetPtr ActionsMatcher::makeSet(const ASTFunction & node, Data & data)
{
/** You need to convert the right argument to a set.
* This can be a table name, a value, a value enumeration, or a subquery.
* The enumeration of values is parsed as a function `tuple`.
*/
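/// Editor's note (illustrative): the right argument may take three forms, e.g.
///     x IN (1, 2, 3)            -- explicit enumeration -> makeExplicitSet
///     x IN (SELECT id FROM t)   -- subquery -> SubqueryForSet, built on demand
///     x IN set_table            -- hypothetical table with ENGINE = Set, reused as a prepared set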
const IAST & args = *node.arguments;
const ASTPtr & arg = args.children.at(1);
const Block & sample_block = data.getSampleBlock();
/// If the subquery or table name for SELECT.
const auto * identifier = arg->as<ASTIdentifier>();
if (arg->as<ASTSubquery>() || identifier)
{
auto set_key = PreparedSetKey::forSubquery(*arg);
if (data.prepared_sets.count(set_key))
return data.prepared_sets.at(set_key);
/// A special case is if the name of the table is specified on the right side of the IN statement,
/// and the table has the type Set (a previously prepared set).
if (identifier)
{
DatabaseAndTableWithAlias database_table(*identifier);
StoragePtr table = data.context.tryGetTable(database_table.database, database_table.table);
if (table)
{
StorageSet * storage_set = dynamic_cast<StorageSet *>(table.get());
if (storage_set)
{
data.prepared_sets[set_key] = storage_set->getSet();
return storage_set->getSet();
}
}
@ -576,25 +580,25 @@ SetPtr ActionsVisitor::makeSet(const ASTFunction * node, const Block & sample_bl
/// We get the stream of blocks for the subquery. Create Set and put it in place of the subquery.
String set_id = arg->getColumnName();
SubqueryForSet & subquery_for_set = data.subqueries_for_sets[set_id];
/// If you already created a Set with the same subquery / table.
if (subquery_for_set.set)
{
data.prepared_sets[set_key] = subquery_for_set.set;
return subquery_for_set.set;
}
SetPtr set = std::make_shared<Set>(data.set_size_limit, false);
/** The following happens for GLOBAL INs:
* - in the addExternalStorage function, the IN (SELECT ...) subquery is replaced with IN _data1,
* in the subquery_for_set object, this subquery is set as source and the temporary table _data1 as the table.
* - this function shows the expression IN_data1.
*/
if (!subquery_for_set.source && data.no_storage_or_local)
{
auto interpreter = interpretSubquery(arg, data.context, data.subquery_depth, {});
subquery_for_set.source = std::make_shared<LazyBlockInputStream>(
interpreter->getSampleBlock(), [interpreter]() mutable { return interpreter->execute().in; });
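/// Editor's note (illustrative): by this point a GLOBAL IN (SELECT ...) has been rewritten to
/// reference a temporary table (e.g. _data1, see the comment above); the source stream is created
/// lazily so the subquery is executed only if the set is actually needed here.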
@ -627,13 +631,13 @@ SetPtr ActionsVisitor::makeSet(const ASTFunction * node, const Block & sample_bl
}
subquery_for_set.set = set;
data.prepared_sets[set_key] = set;
return set;
}
else
{
/// An explicit enumeration of values in parentheses.
return makeExplicitSet(&node, sample_block, false, data.context, data.set_size_limit, data.prepared_sets);
}
}

View File

@ -4,6 +4,7 @@
#include <Interpreters/PreparedSets.h>
#include <Interpreters/ExpressionActions.h>
#include <Interpreters/SubqueryForSet.h>
#include <Interpreters/InDepthNodeVisitor.h>
namespace DB
@ -52,36 +53,81 @@ struct ScopeStack
const Block & getSampleBlock() const;
};
class ASTIdentifier;
class ASTFunction;
class ASTLiteral;
/// Collect ExpressionAction from AST. Returns PreparedSets and SubqueriesForSets too.
/// After the AST is visited, the source ExpressionActions should be updated with the updateActions() method.
class ActionsMatcher
{
public:
using Visitor = ConstInDepthNodeVisitor<ActionsMatcher, true>;
struct Data
{
const Context & context;
SizeLimits set_size_limit;
size_t subquery_depth;
const NamesAndTypesList & source_columns;
PreparedSets & prepared_sets;
SubqueriesForSets & subqueries_for_sets;
bool no_subqueries;
bool only_consts;
bool no_storage_or_local;
size_t visit_depth;
ScopeStack actions_stack;
Data(const Context & context_, SizeLimits set_size_limit_, size_t subquery_depth_,
const NamesAndTypesList & source_columns_, const ExpressionActionsPtr & actions,
PreparedSets & prepared_sets_, SubqueriesForSets & subqueries_for_sets_,
bool no_subqueries_, bool only_consts_, bool no_storage_or_local_)
: context(context_),
set_size_limit(set_size_limit_),
subquery_depth(subquery_depth_),
source_columns(source_columns_),
prepared_sets(prepared_sets_),
subqueries_for_sets(subqueries_for_sets_),
no_subqueries(no_subqueries_),
only_consts(only_consts_),
no_storage_or_local(no_storage_or_local_),
visit_depth(0),
actions_stack(actions, context)
{}
void updateActions(ExpressionActionsPtr & actions)
{
actions = actions_stack.popLevel();
}
void addAction(const ExpressionAction & action)
{
actions_stack.addAction(action);
}
const Block & getSampleBlock() const
{
return actions_stack.getSampleBlock();
}
/// Does the result of the calculation already exist in the block?
bool hasColumn(const String & columnName) const
{
return actions_stack.getSampleBlock().has(columnName);
}
};
static void visit(const ASTPtr & ast, Data & data);
static bool needChildVisit(const ASTPtr & node, const ASTPtr & child);
private:
static void visit(const ASTIdentifier & identifier, const ASTPtr & ast, Data & data);
static void visit(const ASTFunction & node, const ASTPtr & ast, Data & data);
static void visit(const ASTLiteral & literal, const ASTPtr & ast, Data & data);
static SetPtr makeSet(const ASTFunction & node, Data & data);
};
using ActionsVisitor = ActionsMatcher::Visitor;
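/// Editor's note (illustrative sketch of intended use, mirroring ExpressionAnalyzer::getRootActions):
///     ActionsVisitor::Data visitor_data(context, size_limits_for_set, subquery_depth,
///         source_columns, actions, prepared_sets, subqueries_for_sets,
///         no_subqueries, only_consts, no_storage_or_local);
///     ActionsVisitor(visitor_data, log_stream).visit(ast);
///     visitor_data.updateActions(actions);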
}

View File

@ -1,7 +1,5 @@
#include <Interpreters/AnalyzedJoin.h>
#include <Interpreters/DatabaseAndTableWithAlias.h>
#include <Interpreters/SyntaxAnalyzer.h>
#include <Interpreters/ExpressionAnalyzer.h>
#include <Interpreters/InterpreterSelectWithUnionQuery.h>
#include <Parsers/ASTExpressionList.h>
@ -50,40 +48,6 @@ size_t AnalyzedJoin::rightKeyInclusion(const String & name) const
return count;
}
ExpressionActionsPtr AnalyzedJoin::createJoinedBlockActions(
const NamesAndTypesList & columns_added_by_join,
const ASTSelectQuery * select_query_with_join,
const Context & context) const
{
if (!select_query_with_join)
return nullptr;
const ASTTablesInSelectQueryElement * join = select_query_with_join->join();
if (!join)
return nullptr;
const auto & join_params = join->table_join->as<ASTTableJoin &>();
/// Create custom expression list with join keys from right table.
auto expression_list = std::make_shared<ASTExpressionList>();
ASTs & children = expression_list->children;
if (join_params.on_expression)
for (const auto & join_right_key : key_asts_right)
children.emplace_back(join_right_key);
NameSet required_columns_set(key_names_right.begin(), key_names_right.end());
for (const auto & joined_column : columns_added_by_join)
required_columns_set.insert(joined_column.name);
Names required_columns(required_columns_set.begin(), required_columns_set.end());
ASTPtr query = expression_list;
auto syntax_result = SyntaxAnalyzer(context).analyze(query, columns_from_joined_table, required_columns);
ExpressionAnalyzer analyzer(query, syntax_result, context, required_columns_set);
return analyzer.getActions(true, false);
}
void AnalyzedJoin::deduplicateAndQualifyColumnNames(const NameSet & left_table_columns, const String & right_table_prefix)
{
NameSet joined_columns;

View File

@ -14,9 +14,6 @@ class Context;
class ASTSelectQuery;
struct DatabaseAndTableWithAlias;
class ExpressionActions;
using ExpressionActionsPtr = std::shared_ptr<ExpressionActions>;
struct AnalyzedJoin
{
/** Query of the form `SELECT expr(x) AS k FROM t1 ANY LEFT JOIN (SELECT expr(x) AS k FROM t2) USING k`
@ -35,6 +32,7 @@ private:
friend class SyntaxAnalyzer;
friend struct SyntaxAnalyzerResult;
friend class ExpressionAnalyzer;
friend class SelectQueryExpressionAnalyzer;
Names key_names_left;
Names key_names_right; /// Duplicating names are qualified.
@ -55,10 +53,8 @@ public:
void addUsingKey(const ASTPtr & ast);
void addOnKeys(ASTPtr & left_table_ast, ASTPtr & right_table_ast);
ExpressionActionsPtr createJoinedBlockActions(
const NamesAndTypesList & columns_added_by_join, /// Subset of available_joined_columns.
const ASTSelectQuery * select_query_with_join,
const Context & context) const;
bool hasUsing() const { return with_using; }
bool hasOn() const { return !with_using; }
NameSet getQualifiedColumnsSet() const;
NameSet getOriginalColumnsSet() const;

View File

@ -180,19 +180,22 @@ void AsynchronousMetrics::update()
calculateMaxAndSum(max_inserts_in_queue, sum_inserts_in_queue, status.queue.inserts_in_queue);
calculateMaxAndSum(max_merges_in_queue, sum_merges_in_queue, status.queue.merges_in_queue);
if (!status.is_readonly)
{
try
{
time_t absolute_delay = 0;
time_t relative_delay = 0;
table_replicated_merge_tree->getReplicaDelays(absolute_delay, relative_delay);
calculateMax(max_absolute_delay, absolute_delay);
calculateMax(max_relative_delay, relative_delay);
}
catch (...)
{
tryLogCurrentException(__PRETTY_FUNCTION__,
"Cannot get replica delay for table: " + backQuoteIfNeed(db.first) + "." + backQuoteIfNeed(iterator->name()));
}
}
calculateMax(max_part_count_for_partition, table_replicated_merge_tree->getMaxPartsCountForPartition());
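/// Editor's note (assumption): the is_readonly guard above skips getReplicaDelays() for read-only
/// replicas, where the call would throw and log a "Cannot get replica delay" message on every update.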

View File

@ -38,10 +38,6 @@
#include <Interpreters/Compiler.h>
#include <Interpreters/SettingsConstraints.h>
#include <Interpreters/SystemLog.h>
#include <Interpreters/QueryLog.h>
#include <Interpreters/QueryThreadLog.h>
#include <Interpreters/PartLog.h>
#include <Interpreters/TraceLog.h>
#include <Interpreters/Context.h>
#include <Interpreters/DDLWorker.h>
#include <Common/DNSResolver.h>
@ -659,6 +655,10 @@ void Context::setProfile(const String & profile)
settings_constraints = std::move(new_constraints);
}
std::shared_ptr<const User> Context::getUser(const String & user_name)
{
return shared->users_manager->getUser(user_name);
}
void Context::setUser(const String & name, const String & password, const Poco::Net::SocketAddress & address, const String & quota_key)
{
@ -1712,6 +1712,7 @@ std::shared_ptr<PartLog> Context::getPartLog(const String & part_database)
return shared->system_logs->part_log;
}
std::shared_ptr<TraceLog> Context::getTraceLog()
{
auto lock = getLock();
@ -1722,6 +1723,7 @@ std::shared_ptr<TraceLog> Context::getTraceLog()
return shared->system_logs->trace_log;
}
std::shared_ptr<TextLog> Context::getTextLog()
{
auto lock = getLock();
@ -1733,6 +1735,17 @@ std::shared_ptr<TextLog> Context::getTextLog()
}
std::shared_ptr<MetricLog> Context::getMetricLog()
{
auto lock = getLock();
if (!shared->system_logs || !shared->system_logs->metric_log)
return {};
return shared->system_logs->metric_log;
}
CompressionCodecPtr Context::chooseCompressionCodec(size_t part_size, double part_size_ratio) const
{
auto lock = getLock();

View File

@ -6,6 +6,7 @@
#include <Core/Types.h>
#include <DataStreams/IBlockStream_fwd.h>
#include <Interpreters/ClientInfo.h>
#include <Interpreters/Users.h>
#include <Parsers/IAST_fwd.h>
#include <Common/LRUCache.h>
#include <Common/MultiVersion.h>
@ -64,6 +65,7 @@ class QueryThreadLog;
class PartLog;
class TextLog;
class TraceLog;
class MetricLog;
struct MergeTreeSettings;
class IDatabase;
class DDLGuard;
@ -199,6 +201,10 @@ public:
/// Must be called before getClientInfo.
void setUser(const String & name, const String & password, const Poco::Net::SocketAddress & address, const String & quota_key);
/// Used by MySQL Secure Password Authentication plugin.
std::shared_ptr<const User> getUser(const String & user_name);
/// Compute and set actual user settings, client_info.current_user should be set
void calculateUserSettings();
@ -437,6 +443,7 @@ public:
std::shared_ptr<QueryThreadLog> getQueryThreadLog();
std::shared_ptr<TraceLog> getTraceLog();
std::shared_ptr<TextLog> getTextLog();
std::shared_ptr<MetricLog> getMetricLog();
/// Returns an object used to log operations with parts, if it is possible.
/// Provide table name to make required checks.

View File

@ -54,10 +54,11 @@
#include <Interpreters/interpretSubquery.h>
#include <Interpreters/DatabaseAndTableWithAlias.h>
#include <Interpreters/QueryNormalizer.h>
#include <Interpreters/ActionsVisitor.h>
#include <Interpreters/ExternalTablesVisitor.h>
#include <Interpreters/GlobalSubqueriesVisitor.h>
#include <Interpreters/GetAggregatesVisitor.h>
namespace DB
{
@ -68,26 +69,22 @@ using LogAST = DebugASTLog<false>; /// set to true to enable logs
namespace ErrorCodes
{
extern const int UNKNOWN_IDENTIFIER;
extern const int ILLEGAL_AGGREGATION;
extern const int EXPECTED_ALL_OR_ANY;
extern const int LOGICAL_ERROR;
}
ExpressionAnalyzer::ExpressionAnalyzer(
const ASTPtr & query_,
const SyntaxAnalyzerResultPtr & syntax_analyzer_result_,
const Context & context_,
size_t subquery_depth_,
bool do_global)
: query(query_), context(context_), settings(context.getSettings())
, subquery_depth(subquery_depth_)
, syntax(syntax_analyzer_result_)
{
/// external_tables, subqueries_for_sets for global subqueries.
/// Replaces global subqueries with the generated names of temporary tables that will be sent to remote servers.
initGlobalSubqueriesAndExternalTables();
initGlobalSubqueriesAndExternalTables(do_global);
/// has_aggregation, aggregation_keys, aggregate_descriptions, aggregated_columns.
/// This analysis should be performed after processing global subqueries, because otherwise,
@ -116,9 +113,6 @@ void ExpressionAnalyzer::analyzeAggregation()
auto * select_query = query->as<ASTSelectQuery>();
if (select_query && (select_query->groupBy() || select_query->having()))
has_aggregation = true;
ExpressionActionsPtr temp_actions = std::make_shared<ExpressionActions>(sourceColumns(), context);
if (select_query)
@ -146,15 +140,17 @@ void ExpressionAnalyzer::analyzeAggregation()
for (const auto & key_ast : analyzedJoin().key_asts_left)
getRootActions(key_ast, true, temp_actions);
addJoinAction(temp_actions, true);
addJoinAction(temp_actions);
}
}
getAggregates(query, temp_actions);
has_aggregation = makeAggregateDescriptions(temp_actions);
if (select_query && (select_query->groupBy() || select_query->having()))
has_aggregation = true;
if (has_aggregation)
{
assertSelect();
getSelectQuery(); /// assertSelect()
/// Find out aggregation keys.
if (select_query->groupBy())
@ -223,7 +219,7 @@ void ExpressionAnalyzer::analyzeAggregation()
}
void ExpressionAnalyzer::initGlobalSubqueriesAndExternalTables()
void ExpressionAnalyzer::initGlobalSubqueriesAndExternalTables(bool do_global)
{
/// Adds existing external tables (not subqueries) to the external_tables dictionary.
ExternalTablesVisitor::Data tables_data{context, external_tables};
@ -238,21 +234,7 @@ void ExpressionAnalyzer::initGlobalSubqueriesAndExternalTables()
}
void ExpressionAnalyzer::makeSetsForIndex()
{
const auto * select_query = query->as<ASTSelectQuery>();
if (storage() && select_query && storage()->supportsIndexForIn())
{
if (select_query->where())
makeSetsForIndexImpl(select_query->where());
if (select_query->prewhere())
makeSetsForIndexImpl(select_query->prewhere());
}
}
void ExpressionAnalyzer::tryMakeSetForIndexFromSubquery(const ASTPtr & subquery_or_table_name)
void SelectQueryExpressionAnalyzer::tryMakeSetForIndexFromSubquery(const ASTPtr & subquery_or_table_name)
{
auto set_key = PreparedSetKey::forSubquery(*subquery_or_table_name);
if (prepared_sets.count(set_key))
@ -277,8 +259,12 @@ void ExpressionAnalyzer::tryMakeSetForIndexFromSubquery(const ASTPtr & subquery_
}
void ExpressionAnalyzer::makeSetsForIndexImpl(const ASTPtr & node)
/// Performance optimisation for IN() if storage supports it.
void SelectQueryExpressionAnalyzer::makeSetsForIndex(const ASTPtr & node)
{
if (!node || !storage() || !storage()->supportsIndexForIn())
return;
for (auto & child : node->children)
{
/// Don't descend into subqueries.
@ -290,15 +276,16 @@ void ExpressionAnalyzer::makeSetsForIndexImpl(const ASTPtr & node)
if (func && func->name == "lambda")
continue;
makeSetsForIndexImpl(child);
makeSetsForIndex(child);
}
const auto * func = node->as<ASTFunction>();
if (func && functionIsInOperator(func->name))
{
const IAST & args = *func->arguments;
const ASTPtr & left_in_operand = args.children.at(0);
if (storage() && storage()->mayBenefitFromIndexForIn(args.children.at(0), context))
if (storage()->mayBenefitFromIndexForIn(left_in_operand, context))
{
const ASTPtr & arg = args.children.at(1);
if (arg->as<ASTSubquery>() || arg->as<ASTIdentifier>())
@ -310,13 +297,13 @@ void ExpressionAnalyzer::makeSetsForIndexImpl(const ASTPtr & node)
{
NamesAndTypesList temp_columns = sourceColumns();
temp_columns.insert(temp_columns.end(), array_join_columns.begin(), array_join_columns.end());
for (const auto & joined_column : columnsAddedByJoin())
temp_columns.push_back(joined_column);
temp_columns.insert(temp_columns.end(), columnsAddedByJoin().begin(), columnsAddedByJoin().end());
ExpressionActionsPtr temp_actions = std::make_shared<ExpressionActions>(temp_columns, context);
getRootActions(func->arguments->children.at(0), true, temp_actions);
getRootActions(left_in_operand, true, temp_actions);
Block sample_block_with_calculated_columns = temp_actions->getSampleBlock();
if (sample_block_with_calculated_columns.has(args.children.at(0)->getColumnName()))
if (sample_block_with_calculated_columns.has(left_in_operand->getColumnName()))
makeExplicitSet(func, sample_block_with_calculated_columns, true, context,
settings.size_limits_for_set, prepared_sets);
}
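/// Editor's note (illustrative): this pass pre-builds sets for predicates like `key IN (1, 2, 3)`
/// on columns the storage can index, letting KeyCondition prune data ranges before reading.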
@ -328,74 +315,27 @@ void ExpressionAnalyzer::makeSetsForIndexImpl(const ASTPtr & node)
void ExpressionAnalyzer::getRootActions(const ASTPtr & ast, bool no_subqueries, ExpressionActionsPtr & actions, bool only_consts)
{
LogAST log;
ActionsVisitor::Data visitor_data(context, settings.size_limits_for_set, subquery_depth,
sourceColumns(), actions, prepared_sets, subqueries_for_sets,
no_subqueries, only_consts, !isRemoteStorage());
ActionsVisitor(visitor_data, log.stream()).visit(ast);
visitor_data.updateActions(actions);
}
bool ExpressionAnalyzer::makeAggregateDescriptions(ExpressionActionsPtr & actions)
{
for (const ASTFunction * node : aggregates())
{
AggregateDescription aggregate;
aggregate.column_name = node->getColumnName();
const ASTs & arguments = node->arguments->children;
aggregate.argument_names.resize(arguments.size());
DataTypes types(arguments.size());
for (size_t i = 0; i < arguments.size(); ++i)
{
getRootActions(arguments[i], true, actions);
const std::string & name = arguments[i]->getColumnName();
types[i] = actions->getSampleBlock().getByName(name).type;
@ -407,41 +347,24 @@ void ExpressionAnalyzer::getAggregates(const ASTPtr & ast, ExpressionActionsPtr
aggregate_descriptions.push_back(aggregate);
}
return !aggregates().empty();
}
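/// Editor's note (illustrative): for SELECT sum(x + 1) FROM t this records one AggregateDescription
/// with column name sum(plus(x, 1)); the argument expression x + 1 is added to `actions` so that
/// its column exists in the block before aggregation runs.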
void ExpressionAnalyzer::assertNoAggregates(const ASTPtr & ast, const char * description)
{
const auto * node = ast->as<ASTFunction>();
if (node && AggregateFunctionFactory::instance().isAggregateFunctionName(node->name))
throw Exception("Aggregate function " + node->getColumnName()
+ " is found " + String(description) + " in query", ErrorCodes::ILLEGAL_AGGREGATION);
for (const auto & child : ast->children)
if (!child->as<ASTSubquery>() && !child->as<ASTSelectQuery>())
assertNoAggregates(child, description);
}
void ExpressionAnalyzer::assertSelect() const
const ASTSelectQuery * ExpressionAnalyzer::getSelectQuery() const
{
const auto * select_query = query->as<ASTSelectQuery>();
if (!select_query)
throw Exception("Not a select query", ErrorCodes::LOGICAL_ERROR);
return select_query;
}
void ExpressionAnalyzer::assertAggregation() const
const ASTSelectQuery * SelectQueryExpressionAnalyzer::getAggregatingQuery() const
{
if (!has_aggregation)
throw Exception("No aggregation", ErrorCodes::LOGICAL_ERROR);
return getSelectQuery();
}
void ExpressionAnalyzer::initChain(ExpressionActionsChain & chain, const NamesAndTypesList & columns) const
@ -469,11 +392,9 @@ void ExpressionAnalyzer::addMultipleArrayJoinAction(ExpressionActionsPtr & actio
actions->add(ExpressionAction::arrayJoin(result_columns, array_join_is_left, context));
}
bool ExpressionAnalyzer::appendArrayJoin(ExpressionActionsChain & chain, bool only_types)
bool SelectQueryExpressionAnalyzer::appendArrayJoin(ExpressionActionsChain & chain, bool only_types)
{
const auto * select_query = query->as<ASTSelectQuery>();
assertSelect();
const auto * select_query = getSelectQuery();
bool is_array_join_left;
ASTPtr array_join_expression_list = select_query->array_join_expression_list(is_array_join_left);
@ -490,17 +411,6 @@ bool ExpressionAnalyzer::appendArrayJoin(ExpressionActionsChain & chain, bool on
return true;
}
void ExpressionAnalyzer::addJoinAction(ExpressionActionsPtr & actions, bool only_types) const
{
if (only_types)
actions->add(ExpressionAction::ordinaryJoin(nullptr, analyzedJoin().key_names_left, columnsAddedByJoin()));
else
for (auto & subquery_for_set : subqueries_for_sets)
if (subquery_for_set.second.join)
actions->add(ExpressionAction::ordinaryJoin(subquery_for_set.second.join, analyzedJoin().key_names_left,
columnsAddedByJoin()));
}
static void appendRequiredColumns(
NameSet & required_columns, const Block & sample, const Names & key_names_right, const NamesAndTypesList & columns_added_by_join)
{
@ -513,41 +423,37 @@ static void appendRequiredColumns(
required_columns.insert(column.name);
}
/// It's possible to set nullptr as join for only_types mode
void ExpressionAnalyzer::addJoinAction(ExpressionActionsPtr & actions, JoinPtr join) const
{
actions->add(ExpressionAction::ordinaryJoin(join, analyzedJoin().key_names_left, columnsAddedByJoin()));
}
bool SelectQueryExpressionAnalyzer::appendJoin(ExpressionActionsChain & chain, bool only_types)
{
const ASTTablesInSelectQueryElement * ast_join = getSelectQuery()->join();
if (!ast_join)
return false;
SubqueryForSet & subquery_for_set = getSubqueryForJoin(*ast_join);
ASTPtr left_keys_list = std::make_shared<ASTExpressionList>();
left_keys_list->children = analyzedJoin().key_asts_left;
initChain(chain, sourceColumns());
ExpressionActionsChain::Step & step = chain.steps.back();
getRootActions(left_keys_list, only_types, step.actions);
addJoinAction(step.actions, subquery_for_set.join);
return true;
}
static JoinPtr tryGetStorageJoin(const ASTTablesInSelectQueryElement & join_element, const Context & context)
{
const auto & table_to_join = join_element.table_expression->as<ASTTableExpression &>();
auto & join_params = join_element.table_join->as<ASTTableJoin &>();
/// Special case - if table name is specified on the right of JOIN, then the table has the type Join (the previously prepared mapping).
/// TODO This syntax does not support specifying a database name.
if (table_to_join.database_and_table_name)
{
@ -563,72 +469,106 @@ bool ExpressionAnalyzer::appendJoin(ExpressionActionsChain & chain, bool only_ty
storage_join->assertCompatible(join_params.kind, join_params.strictness);
/// TODO Check the set of keys.
return storage_join->getJoin();
}
}
}
return {};
}
SubqueryForSet & SelectQueryExpressionAnalyzer::getSubqueryForJoin(const ASTTablesInSelectQueryElement & join_element)
{
/// Two JOINs are not supported with the same subquery, but different USINGs.
auto join_hash = join_element.getTreeHash();
String join_subquery_id = toString(join_hash.first) + "_" + toString(join_hash.second);
SubqueryForSet & subquery_for_set = subqueries_for_sets[join_subquery_id];
/// Special case - if table name is specified on the right of JOIN, then the table has the type Join (the previously prepared mapping).
if (!subquery_for_set.join)
subquery_for_set.join = tryGetStorageJoin(join_element, context);
if (!subquery_for_set.join)
makeHashJoin(join_element, subquery_for_set);
return subquery_for_set;
}
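/// Editor's note (illustrative): the subquery cache key is the tree hash of the whole JOIN element,
/// so a repeated identical JOIN reuses one SubqueryForSet instead of rebuilding the right-hand table.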
void SelectQueryExpressionAnalyzer::makeHashJoin(const ASTTablesInSelectQueryElement & join_element,
SubqueryForSet & subquery_for_set) const
{
/// Actions which need to be calculated on joined block.
ExpressionActionsPtr joined_block_actions = createJoinedBlockActions();
/** For GLOBAL JOINs (in the case, for example, of the push method for executing GLOBAL subqueries), the following occurs
* - in the addExternalStorage function, the JOIN (SELECT ...) subquery is replaced with JOIN _data1,
* in the subquery_for_set object this subquery is exposed as source and the temporary table _data1 as the `table`.
* - this function shows the expression JOIN _data1.
*/
if (!subquery_for_set.source)
{
ASTPtr table;
auto & table_to_join = join_element.table_expression->as<ASTTableExpression &>();
if (table_to_join.subquery)
table = table_to_join.subquery;
else if (table_to_join.table_function)
table = table_to_join.table_function;
else if (table_to_join.database_and_table_name)
table = table_to_join.database_and_table_name;
Names action_columns = joined_block_actions->getRequiredColumns();
NameSet required_columns(action_columns.begin(), action_columns.end());
auto & analyzed_join = analyzedJoin();
appendRequiredColumns(
required_columns, joined_block_actions->getSampleBlock(), analyzed_join.key_names_right, columnsAddedByJoin());
auto original_map = analyzed_join.getOriginalColumnsMap(required_columns);
Names original_columns;
for (auto & pr : original_map)
original_columns.push_back(pr.second);
auto interpreter = interpretSubquery(table, context, subquery_depth, original_columns);
subquery_for_set.makeSource(interpreter, original_map);
}
Block sample_block = subquery_for_set.renamedSampleBlock();
joined_block_actions->execute(sample_block);
/// TODO You do not need to set this up when JOIN is only needed on remote servers.
auto & join_params = join_element.table_join->as<ASTTableJoin &>();
subquery_for_set.join = std::make_shared<Join>(analyzedJoin().key_names_right, settings.join_use_nulls,
settings.size_limits_for_join, join_params.kind, join_params.strictness);
subquery_for_set.join->setSampleBlock(sample_block);
subquery_for_set.joined_block_actions = joined_block_actions;
}
ExpressionActionsPtr SelectQueryExpressionAnalyzer::createJoinedBlockActions() const
{
/// Create custom expression list with join keys from right table.
ASTPtr expression_list = std::make_shared<ASTExpressionList>();
ASTs & children = expression_list->children;
if (analyzedJoin().hasOn())
for (const auto & join_right_key : analyzedJoin().key_asts_right)
children.emplace_back(join_right_key);
NameSet required_columns_set(analyzedJoin().key_names_right.begin(), analyzedJoin().key_names_right.end());
for (const auto & joined_column : columnsAddedByJoin())
required_columns_set.insert(joined_column.name);
Names required_columns(required_columns_set.begin(), required_columns_set.end());
auto syntax_result = SyntaxAnalyzer(context).analyze(expression_list, analyzedJoin().columns_from_joined_table, required_columns);
return ExpressionAnalyzer(expression_list, syntax_result, context).getActions(true, false);
}
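/// Editor's note (illustrative): given ... JOIN t2 ON t1.a = t2.b + 1, the right-hand key b + 1
/// has to be computed on the joined block; the actions built here evaluate such expressions
/// (plus the columns added by the join) before the hash table is filled.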
bool SelectQueryExpressionAnalyzer::appendPrewhere(
ExpressionActionsChain & chain, bool only_types, const Names & additional_required_columns)
{
const auto * select_query = query->as<ASTSelectQuery>();
assertSelect();
const auto * select_query = getSelectQuery();
if (!select_query->prewhere())
return false;
@ -699,11 +639,9 @@ bool ExpressionAnalyzer::appendPrewhere(
return true;
}
bool ExpressionAnalyzer::appendWhere(ExpressionActionsChain & chain, bool only_types)
bool SelectQueryExpressionAnalyzer::appendWhere(ExpressionActionsChain & chain, bool only_types)
{
const auto * select_query = query->as<ASTSelectQuery>();
assertSelect();
const auto * select_query = getSelectQuery();
if (!select_query->where())
return false;
@ -719,11 +657,9 @@ bool ExpressionAnalyzer::appendWhere(ExpressionActionsChain & chain, bool only_t
return true;
}
bool ExpressionAnalyzer::appendGroupBy(ExpressionActionsChain & chain, bool only_types)
bool SelectQueryExpressionAnalyzer::appendGroupBy(ExpressionActionsChain & chain, bool only_types)
{
const auto * select_query = query->as<ASTSelectQuery>();
assertAggregation();
const auto * select_query = getAggregatingQuery();
if (!select_query->groupBy())
return false;
@ -741,11 +677,9 @@ bool ExpressionAnalyzer::appendGroupBy(ExpressionActionsChain & chain, bool only
return true;
}
void ExpressionAnalyzer::appendAggregateFunctionsArguments(ExpressionActionsChain & chain, bool only_types)
void SelectQueryExpressionAnalyzer::appendAggregateFunctionsArguments(ExpressionActionsChain & chain, bool only_types)
{
const auto * select_query = query->as<ASTSelectQuery>();
assertAggregation();
const auto * select_query = getAggregatingQuery();
initChain(chain, sourceColumns());
ExpressionActionsChain::Step & step = chain.steps.back();
@ -758,20 +692,27 @@ void ExpressionAnalyzer::appendAggregateFunctionsArguments(ExpressionActionsChai
}
}
getActionsBeforeAggregation(select_query->select(), step.actions, only_types);
/// Collect aggregates removing duplicates by node.getColumnName()
/// It's not clear why we recollect aggregates (for query parts) while we're able to use previously collected ones (for the entire query).
/// @note The original recollection logic didn't remove duplicates.
GetAggregatesVisitor::Data data;
GetAggregatesVisitor(data).visit(select_query->select());
if (select_query->having())
getActionsBeforeAggregation(select_query->having(), step.actions, only_types);
GetAggregatesVisitor(data).visit(select_query->having());
if (select_query->orderBy())
getActionsBeforeAggregation(select_query->orderBy(), step.actions, only_types);
GetAggregatesVisitor(data).visit(select_query->orderBy());
/// TODO: data.aggregates -> aggregates()
for (const ASTFunction * node : data.aggregates)
for (auto & argument : node->arguments->children)
getRootActions(argument, only_types, step.actions);
}
bool ExpressionAnalyzer::appendHaving(ExpressionActionsChain & chain, bool only_types)
bool SelectQueryExpressionAnalyzer::appendHaving(ExpressionActionsChain & chain, bool only_types)
{
const auto * select_query = query->as<ASTSelectQuery>();
assertAggregation();
const auto * select_query = getAggregatingQuery();
if (!select_query->having())
return false;
@ -785,11 +726,9 @@ bool ExpressionAnalyzer::appendHaving(ExpressionActionsChain & chain, bool only_
return true;
}
void ExpressionAnalyzer::appendSelect(ExpressionActionsChain & chain, bool only_types)
void SelectQueryExpressionAnalyzer::appendSelect(ExpressionActionsChain & chain, bool only_types)
{
const auto * select_query = query->as<ASTSelectQuery>();
assertSelect();
const auto * select_query = getSelectQuery();
initChain(chain, aggregated_columns);
ExpressionActionsChain::Step & step = chain.steps.back();
@ -800,11 +739,9 @@ void ExpressionAnalyzer::appendSelect(ExpressionActionsChain & chain, bool only_
step.required_output.push_back(child->getColumnName());
}
bool ExpressionAnalyzer::appendOrderBy(ExpressionActionsChain & chain, bool only_types)
bool SelectQueryExpressionAnalyzer::appendOrderBy(ExpressionActionsChain & chain, bool only_types)
{
const auto * select_query = query->as<ASTSelectQuery>();
assertSelect();
const auto * select_query = getSelectQuery();
if (!select_query->orderBy())
return false;
@ -826,11 +763,9 @@ bool ExpressionAnalyzer::appendOrderBy(ExpressionActionsChain & chain, bool only
return true;
}
bool ExpressionAnalyzer::appendLimitBy(ExpressionActionsChain & chain, bool only_types)
bool SelectQueryExpressionAnalyzer::appendLimitBy(ExpressionActionsChain & chain, bool only_types)
{
const auto * select_query = query->as<ASTSelectQuery>();
assertSelect();
const auto * select_query = getSelectQuery();
if (!select_query->limitBy())
return false;
@ -857,11 +792,9 @@ bool ExpressionAnalyzer::appendLimitBy(ExpressionActionsChain & chain, bool only
return true;
}
void ExpressionAnalyzer::appendProjectResult(ExpressionActionsChain & chain) const
void SelectQueryExpressionAnalyzer::appendProjectResult(ExpressionActionsChain & chain) const
{
const auto * select_query = query->as<ASTSelectQuery>();
assertSelect();
const auto * select_query = getSelectQuery();
initChain(chain, aggregated_columns);
ExpressionActionsChain::Step & step = chain.steps.back();
@ -892,19 +825,6 @@ void ExpressionAnalyzer::appendExpression(ExpressionActionsChain & chain, const
}
void ExpressionAnalyzer::getActionsBeforeAggregation(const ASTPtr & ast, ExpressionActionsPtr & actions, bool no_subqueries)
{
const auto * node = ast->as<ASTFunction>();
if (node && AggregateFunctionFactory::instance().isAggregateFunctionName(node->name))
for (auto & argument : node->arguments->children)
getRootActions(argument, no_subqueries, actions);
else
for (auto & child : ast->children)
getActionsBeforeAggregation(child, actions, no_subqueries);
}
ExpressionActionsPtr ExpressionAnalyzer::getActions(bool add_aliases, bool project_result)
{
ExpressionActionsPtr actions = std::make_shared<ExpressionActions>(sourceColumns(), context);
@ -960,7 +880,7 @@ ExpressionActionsPtr ExpressionAnalyzer::getConstActions()
return actions;
}
void ExpressionAnalyzer::getAggregateInfo(Names & key_names, AggregateDescriptions & aggregates) const
void SelectQueryExpressionAnalyzer::getAggregateInfo(Names & key_names, AggregateDescriptions & aggregates) const
{
for (const auto & name_and_type : aggregation_keys)
key_names.emplace_back(name_and_type.name);

View File

@ -2,9 +2,9 @@
#include <Core/Settings.h>
#include <DataStreams/IBlockStream_fwd.h>
#include <Interpreters/ActionsVisitor.h>
#include <Interpreters/AggregateDescription.h>
#include <Interpreters/SyntaxAnalyzer.h>
#include <Interpreters/SubqueryForSet.h>
#include <Parsers/IAST_fwd.h>
#include <Storages/IStorage_fwd.h>
@ -24,6 +24,7 @@ struct ASTTableJoin;
class ASTFunction;
class ASTExpressionList;
class ASTSelectQuery;
struct ASTTablesInSelectQueryElement;
struct SyntaxAnalyzerResult;
using SyntaxAnalyzerResultPtr = std::shared_ptr<const SyntaxAnalyzerResult>;
@ -31,9 +32,6 @@ using SyntaxAnalyzerResultPtr = std::shared_ptr<const SyntaxAnalyzerResult>;
/// ExpressionAnalyzer sources, intermediates and results. It splits data and logic, allows to test them separately.
struct ExpressionAnalyzerData
{
/// If non-empty, ignore all expressions in not from this list.
NameSet required_result_columns;
SubqueriesForSets subqueries_for_sets;
PreparedSets prepared_sets;
@ -49,13 +47,6 @@ struct ExpressionAnalyzerData
/// All new temporary tables obtained by performing the GLOBAL IN/JOIN subqueries.
Tables external_tables;
protected:
ExpressionAnalyzerData(const NameSet & required_result_columns_,
const SubqueriesForSets & subqueries_for_sets_)
: required_result_columns(required_result_columns_),
subqueries_for_sets(subqueries_for_sets_)
{}
};
@ -63,7 +54,7 @@ protected:
*
* NOTE: if `ast` is a SELECT query from a table, the structure of this table should not change during the lifetime of ExpressionAnalyzer.
*/
class ExpressionAnalyzer : private ExpressionAnalyzerData, private boost::noncopyable
class ExpressionAnalyzer : protected ExpressionAnalyzerData, private boost::noncopyable
{
private:
/// Extracts settings to enlight which are used (and avoid copy of others).
@ -73,33 +64,120 @@ private:
const bool join_use_nulls;
const SizeLimits size_limits_for_set;
const SizeLimits size_limits_for_join;
const String join_default_strictness;
ExtractedSettings(const Settings & settings_)
: use_index_for_in_with_subqueries(settings_.use_index_for_in_with_subqueries),
join_use_nulls(settings_.join_use_nulls),
size_limits_for_set(settings_.max_rows_in_set, settings_.max_bytes_in_set, settings_.set_overflow_mode),
size_limits_for_join(settings_.max_rows_in_join, settings_.max_bytes_in_join, settings_.join_overflow_mode),
join_default_strictness(settings_.join_default_strictness.toString())
size_limits_for_join(settings_.max_rows_in_join, settings_.max_bytes_in_join, settings_.join_overflow_mode)
{}
};
public:
/// Ctor for non-select queries. Generally its usage is:
/// auto actions = ExpressionAnalyzer(query, syntax, context).getActions();
ExpressionAnalyzer(
const ASTPtr & query_,
const SyntaxAnalyzerResultPtr & syntax_analyzer_result_,
const Context & context_)
: ExpressionAnalyzer(query_, syntax_analyzer_result_, context_, 0, false)
{}
void appendExpression(ExpressionActionsChain & chain, const ASTPtr & expr, bool only_types);
/// If `ast` is not a SELECT query, just gets all the actions to evaluate the expression.
/// If add_aliases, only the calculated values are kept, in the desired order, and aliases are added.
/// If also project_result, then only aliases remain in the output block.
/// Otherwise, only temporary columns will be deleted from the block.
ExpressionActionsPtr getActions(bool add_aliases, bool project_result = true);
/// Actions that can be performed on an empty block: adding constants and applying functions that depend only on constants.
/// Does not execute subqueries.
ExpressionActionsPtr getConstActions();
/** Sets that require a subquery to be created.
* Only the sets needed to perform actions returned from already executed `append*` or `getActions`.
* That is, you need to call getSubqueriesForSets() after all calls of `append*` or `getActions`
* and create all the returned sets before performing the actions.
*/
const SubqueriesForSets & getSubqueriesForSets() const { return subqueries_for_sets; }
/// Get intermediates for tests
const ExpressionAnalyzerData & getAnalyzedData() const { return *this; }
protected:
ExpressionAnalyzer(
const ASTPtr & query_,
const SyntaxAnalyzerResultPtr & syntax_analyzer_result_,
const Context & context_,
size_t subquery_depth_,
bool do_global_);
ASTPtr query;
const Context & context;
const ExtractedSettings settings;
size_t subquery_depth;
SyntaxAnalyzerResultPtr syntax;
const StoragePtr & storage() const { return syntax->storage; } /// The main table in FROM clause, if exists.
const AnalyzedJoin & analyzedJoin() const { return syntax->analyzed_join; }
const NamesAndTypesList & sourceColumns() const { return syntax->required_source_columns; }
const NamesAndTypesList & columnsAddedByJoin() const { return syntax->columns_added_by_join; }
const std::vector<const ASTFunction *> & aggregates() const { return syntax->aggregates; }
/// Find global subqueries in the GLOBAL IN/JOIN sections. Fills in external_tables.
void initGlobalSubqueriesAndExternalTables(bool do_global);
void addMultipleArrayJoinAction(ExpressionActionsPtr & actions, bool is_left) const;
void addJoinAction(ExpressionActionsPtr & actions, JoinPtr join = {}) const;
void getRootActions(const ASTPtr & ast, bool no_subqueries, ExpressionActionsPtr & actions, bool only_consts = false);
/** Add aggregation keys to aggregation_keys, aggregate functions to aggregate_descriptions,
* Create a set of columns aggregated_columns resulting after the aggregation, if any,
* or after all the actions that are normally performed before aggregation.
* Set has_aggregation = true if there is GROUP BY or at least one aggregate function.
*/
void analyzeAggregation();
bool makeAggregateDescriptions(ExpressionActionsPtr & actions);
/// columns - the columns that are present before the transformations begin.
void initChain(ExpressionActionsChain & chain, const NamesAndTypesList & columns) const;
const ASTSelectQuery * getSelectQuery() const;
bool isRemoteStorage() const;
};
/// SelectQuery specific ExpressionAnalyzer part.
class SelectQueryExpressionAnalyzer : public ExpressionAnalyzer
{
public:
SelectQueryExpressionAnalyzer(
const ASTPtr & query_,
const SyntaxAnalyzerResultPtr & syntax_analyzer_result_,
const Context & context_,
const NameSet & required_result_columns_ = {},
size_t subquery_depth_ = 0,
bool do_global_ = false,
const SubqueriesForSets & subqueries_for_set_ = {});
bool do_global_ = false)
: ExpressionAnalyzer(query_, syntax_analyzer_result_, context_, subquery_depth_, do_global_)
, required_result_columns(required_result_columns_)
{}
/// Does the expression have aggregate functions or a GROUP BY or HAVING section.
bool hasAggregation() const { return has_aggregation; }
bool hasGlobalSubqueries() { return has_global_subqueries; }
/// Get a list of aggregation keys and descriptions of aggregate functions if the query contains GROUP BY.
void getAggregateInfo(Names & key_names, AggregateDescriptions & aggregates) const;
const PreparedSets & getPreparedSets() const { return prepared_sets; }
/// Tables that will need to be sent to remote servers for distributed query processing.
const Tables & getExternalTables() const { return external_tables; }
/** These methods allow you to build a chain of transformations over a block that computes the values for the desired sections of the query.
*
* Example usage:
@ -132,81 +210,12 @@ public:
/// Deletes all columns except those mentioned by SELECT, arranges the remaining columns and renames them to aliases.
void appendProjectResult(ExpressionActionsChain & chain) const;
void appendExpression(ExpressionActionsChain & chain, const ASTPtr & expr, bool only_types);
/// If `ast` is not a SELECT query, just gets all the actions to evaluate the expression.
/// If add_aliases, only keep the calculated values in the desired order, with aliases added.
/// If also project_result, then only aliases remain in the output block.
/// Otherwise, only temporary columns will be deleted from the block.
ExpressionActionsPtr getActions(bool add_aliases, bool project_result = true);
/// Actions that can be performed on an empty block: adding constants and applying functions that depend only on constants.
/// Does not execute subqueries.
ExpressionActionsPtr getConstActions();
/** Sets that require a subquery to be created.
* Only the sets needed to perform actions returned from already executed `append*` or `getActions`.
* That is, you need to call getSubqueriesForSets after all calls of `append*` or `getActions`
* and create all the returned sets before performing the actions.
*/
const SubqueriesForSets & getSubqueriesForSets() const { return subqueries_for_sets; }
const PreparedSets & getPreparedSets() const { return prepared_sets; }
/** Tables that will need to be sent to remote servers for distributed query processing.
*/
const Tables & getExternalTables() const { return external_tables; }
/// Get intermediates for tests
const ExpressionAnalyzerData & getAnalyzedData() const { return *this; }
/// Create the Sets that we can build from the IN section, in order to use the index on them.
void makeSetsForIndex();
bool hasGlobalSubqueries() { return has_global_subqueries; }
void makeSetsForIndex(const ASTPtr & node);
private:
ASTPtr query;
const Context & context;
const ExtractedSettings settings;
size_t subquery_depth;
bool do_global; /// Do I need to prepare for execution global subqueries when analyzing the query.
SyntaxAnalyzerResultPtr syntax;
const StoragePtr & storage() const { return syntax->storage; } /// The main table in FROM clause, if exists.
const AnalyzedJoin & analyzedJoin() const { return syntax->analyzed_join; }
const NamesAndTypesList & sourceColumns() const { return syntax->required_source_columns; }
const NamesAndTypesList & columnsAddedByJoin() const { return syntax->columns_added_by_join; }
/// Find global subqueries in the GLOBAL IN/JOIN sections. Fills in external_tables.
void initGlobalSubqueriesAndExternalTables();
void addMultipleArrayJoinAction(ExpressionActionsPtr & actions, bool is_left) const;
void addJoinAction(ExpressionActionsPtr & actions, bool only_types) const;
/// If ast is ASTSelectQuery with JOIN, add actions for JOIN key columns.
void getActionsFromJoinKeys(const ASTTableJoin & table_join, bool no_subqueries, ExpressionActionsPtr & actions);
void getRootActions(const ASTPtr & ast, bool no_subqueries, ExpressionActionsPtr & actions, bool only_consts = false);
void getActionsBeforeAggregation(const ASTPtr & ast, ExpressionActionsPtr & actions, bool no_subqueries);
/** Add aggregation keys to aggregation_keys, aggregate functions to aggregate_descriptions,
* Create a set of columns aggregated_columns resulting after the aggregation, if any,
* or after all the actions that are normally performed before aggregation.
* Set has_aggregation = true if there is GROUP BY or at least one aggregate function.
*/
void analyzeAggregation();
void getAggregates(const ASTPtr & ast, ExpressionActionsPtr & actions);
void assertNoAggregates(const ASTPtr & ast, const char * description);
/// columns - the columns that are present before the transformations begin.
void initChain(ExpressionActionsChain & chain, const NamesAndTypesList & columns) const;
void assertSelect() const;
void assertAggregation() const;
/// If non-empty, ignore all expressions not from this list.
NameSet required_result_columns;
/**
* Create Set from a subquery or a table expression in the query. The created set is suitable for using the index.
@ -214,9 +223,11 @@ private:
*/
void tryMakeSetForIndexFromSubquery(const ASTPtr & subquery_or_table_name);
void makeSetsForIndexImpl(const ASTPtr & node);
SubqueryForSet & getSubqueryForJoin(const ASTTablesInSelectQueryElement & join_element);
ExpressionActionsPtr createJoinedBlockActions() const;
void makeHashJoin(const ASTTablesInSelectQueryElement & join_element, SubqueryForSet & subquery_for_set) const;
bool isRemoteStorage() const;
const ASTSelectQuery * getAggregatingQuery() const;
};
}
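For illustration, a hedged C++ usage sketch of the split above, mirroring how this commit itself uses the two classes (see generateFilterActions and the expression_analyzer test further down); `context`, `columns`, `expr_ast` and `select_ast` are assumed to be prepared by the caller:
/// Plain expression: the base class suffices.
auto expr_syntax = SyntaxAnalyzer(context).analyze(expr_ast, columns);
ExpressionActionsPtr actions = ExpressionAnalyzer(expr_ast, expr_syntax, context).getActions(false);
/// SELECT query: the append* chain lives in the derived class.
auto select_syntax = SyntaxAnalyzer(context).analyze(select_ast, columns);
SelectQueryExpressionAnalyzer analyzer(select_ast, select_syntax, context);
ExpressionActionsChain chain(context);
analyzer.appendSelect(chain, false);
analyzer.appendProjectResult(chain);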
View File
@ -0,0 +1,75 @@
#pragma once
#include <Interpreters/InDepthNodeVisitor.h>
#include <AggregateFunctions/AggregateFunctionFactory.h>
namespace DB
{
namespace ErrorCodes
{
extern const int ILLEGAL_AGGREGATION;
}
class GetAggregatesMatcher
{
public:
using Visitor = ConstInDepthNodeVisitor<GetAggregatesMatcher, true>;
struct Data
{
const char * assert_no_aggregates = nullptr;
std::unordered_set<String> uniq_names;
std::vector<const ASTFunction *> aggregates;
};
static bool needChildVisit(const ASTPtr & node, const ASTPtr & child)
{
if (child->as<ASTSubquery>() || child->as<ASTSelectQuery>())
return false;
if (auto * func = node->as<ASTFunction>())
if (isAggregateFunction(func->name))
return false;
return true;
}
static void visit(const ASTPtr & ast, Data & data)
{
if (auto * func = ast->as<ASTFunction>())
visit(*func, ast, data);
}
private:
static void visit(const ASTFunction & node, const ASTPtr &, Data & data)
{
if (!isAggregateFunction(node.name))
return;
if (data.assert_no_aggregates)
throw Exception("Aggregate function " + node.getColumnName() + " is found " + String(data.assert_no_aggregates) + " in query",
ErrorCodes::ILLEGAL_AGGREGATION);
String column_name = node.getColumnName();
if (data.uniq_names.count(column_name))
return;
data.uniq_names.insert(column_name);
data.aggregates.push_back(&node);
}
static bool isAggregateFunction(const String & name)
{
return AggregateFunctionFactory::instance().isAggregateFunctionName(name);
}
};
using GetAggregatesVisitor = GetAggregatesMatcher::Visitor;
inline void assertNoAggregates(const ASTPtr & ast, const char * description)
{
GetAggregatesVisitor::Data data{description, {}, {}};
GetAggregatesVisitor(data).visit(ast);
}
}
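For illustration, a hedged fragment showing how this visitor is driven (the same pattern appears in SyntaxAnalyzer.cpp below); `select_expression_ast`, `where_ast` and `process` are hypothetical stand-ins:
/// Collect the top-level aggregate function nodes of an expression, deduplicated by column name.
GetAggregatesVisitor::Data data;
GetAggregatesVisitor(data).visit(select_expression_ast);
for (const ASTFunction * func : data.aggregates)
    process(func); /// hypothetical consumer
/// Or assert that a section contains no aggregates (throws ILLEGAL_AGGREGATION otherwise).
assertNoAggregates(where_ast, "in WHERE");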
View File
@ -7,7 +7,6 @@
#include <Parsers/ASTSelectQuery.h>
#include <Parsers/ASTIdentifier.h>
#include <Interpreters/Context.h>
#include <Interpreters/ActionsVisitor.h>
#include <Interpreters/interpretSubquery.h>
#include <Common/typeid_cast.h>
#include <Core/Block.h>
View File
@ -144,7 +144,7 @@ String generateFilterActions(ExpressionActionsPtr & actions, const StoragePtr &
/// Using separate expression analyzer to prevent any possible alias injection
auto syntax_result = SyntaxAnalyzer(context).analyze(query_ast, storage->getColumns().getAllPhysical());
ExpressionAnalyzer analyzer(query_ast, syntax_result, context);
SelectQueryExpressionAnalyzer analyzer(query_ast, syntax_result, context);
ExpressionActionsChain new_chain(context);
analyzer.appendSelect(new_chain, false);
actions = new_chain.getLastActions();
@ -296,7 +296,7 @@ InterpreterSelectQuery::InterpreterSelectQuery(
syntax_analyzer_result = SyntaxAnalyzer(context, options).analyze(
query_ptr, source_header.getNamesAndTypesList(), required_result_column_names, storage, NamesAndTypesList());
query_analyzer = std::make_unique<ExpressionAnalyzer>(
query_analyzer = std::make_unique<SelectQueryExpressionAnalyzer>(
query_ptr, syntax_analyzer_result, context,
NameSet(required_result_column_names.begin(), required_result_column_names.end()),
options.subquery_depth, !options.only_analyze);
@ -665,7 +665,8 @@ static UInt64 getLimitForSorting(const ASTSelectQuery & query, const Context & c
}
static SortingInfoPtr optimizeReadInOrder(const MergeTreeData & merge_tree, const ASTSelectQuery & query, const Context & context)
static SortingInfoPtr optimizeReadInOrder(const MergeTreeData & merge_tree, const ASTSelectQuery & query,
const Context & context, const SyntaxAnalyzerResultPtr & global_syntax_result)
{
if (!merge_tree.hasSortingKey())
return {};
@ -677,38 +678,21 @@ static SortingInfoPtr optimizeReadInOrder(const MergeTreeData & merge_tree, cons
const auto & sorting_key_columns = merge_tree.getSortingKeyColumns();
size_t prefix_size = std::min(order_descr.size(), sorting_key_columns.size());
auto order_by_expr = query.orderBy();
SyntaxAnalyzerResultPtr syntax_result;
try
{
syntax_result = SyntaxAnalyzer(context).analyze(order_by_expr, merge_tree.getColumns().getAllPhysical());
}
catch (const Exception &)
{
return {};
}
for (size_t i = 0; i < prefix_size; ++i)
{
/// Read in pk order in case of exact match with order key element
if (global_syntax_result->array_join_result_to_source.count(order_descr[i].column_name))
break;
/// Optimize in case of exact match with order key element
/// or in some simple cases when the order key element is wrapped into a monotonic function.
int current_direction = order_descr[i].direction;
if (order_descr[i].column_name == sorting_key_columns[i] && current_direction == read_direction)
prefix_order_descr.push_back(order_descr[i]);
else
{
const auto & ast = query.orderBy()->children[i];
ExpressionActionsPtr actions;
try
{
actions = ExpressionAnalyzer(ast->children.at(0), syntax_result, context).getActions(false);
}
catch (const Exception &)
{
/// Can't analyze order expression at this stage.
/// May be some actions required for order will be executed later.
break;
}
auto ast = query.orderBy()->children[i]->children.at(0);
auto syntax_result = SyntaxAnalyzer(context).analyze(ast, global_syntax_result->required_source_columns);
auto actions = ExpressionAnalyzer(ast, syntax_result, context).getActions(true);
const auto & input_columns = actions->getRequiredColumnsWithTypes();
if (input_columns.size() != 1 || input_columns.front().name != sorting_key_columns[i])
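A self-contained sketch (not from the patch) of the prefix-matching idea behind optimizeReadInOrder: take the longest ORDER BY prefix that coincides with the table's sorting key; the streams are already sorted by that prefix, so only the remaining columns need finishing:
#include <algorithm>
#include <iostream>
#include <string>
#include <vector>
int main()
{
    std::vector<std::string> order_by{"date", "id", "value"};
    std::vector<std::string> sorting_key{"date", "id"};
    size_t prefix = 0;
    while (prefix < std::min(order_by.size(), sorting_key.size())
           && order_by[prefix] == sorting_key[prefix])
        ++prefix;
    /// prefix == 2: data is already sorted by (date, id), so only
    /// a cheaper finish-sort by "value" remains (see executeOrder below).
    std::cout << "matched prefix: " << prefix << '\n';
}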
@ -790,7 +774,8 @@ void InterpreterSelectQuery::executeImpl(TPipeline & pipeline, const BlockInputS
if (!dry_run)
from_stage = storage->getQueryProcessingStage(context);
query_analyzer->makeSetsForIndex();
query_analyzer->makeSetsForIndex(query.where());
query_analyzer->makeSetsForIndex(query.prewhere());
auto optimize_prewhere = [&](auto & merge_tree)
{
@ -820,10 +805,10 @@ void InterpreterSelectQuery::executeImpl(TPipeline & pipeline, const BlockInputS
}
SortingInfoPtr sorting_info;
if (settings.optimize_read_in_order && storage && query.orderBy() && !query.groupBy() && !query.final())
if (settings.optimize_read_in_order && storage && query.orderBy() && !query.groupBy() && !query.final() && !query.join())
{
if (const MergeTreeData * merge_tree_data = dynamic_cast<const MergeTreeData *>(storage.get()))
sorting_info = optimizeReadInOrder(*merge_tree_data, query, context);
sorting_info = optimizeReadInOrder(*merge_tree_data, query, context, syntax_analyzer_result);
}
if (dry_run)
@ -1941,13 +1926,12 @@ void InterpreterSelectQuery::executeOrder(Pipeline & pipeline, SortingInfoPtr so
* At this stage we merge per-thread streams into one.
*/
if (sorting_info->prefix_order_descr.size() < order_descr.size())
bool need_finish_sorting = (sorting_info->prefix_order_descr.size() < order_descr.size());
if (need_finish_sorting)
{
pipeline.transform([&](auto & stream)
{
stream = std::make_shared<FinishSortingBlockInputStream>(
stream, sorting_info->prefix_order_descr,
order_descr, settings.max_block_size, limit);
stream = std::make_shared<PartialSortingBlockInputStream>(stream, order_descr, limit);
});
}
@ -1958,11 +1942,19 @@ void InterpreterSelectQuery::executeOrder(Pipeline & pipeline, SortingInfoPtr so
stream = std::make_shared<AsynchronousBlockInputStream>(stream);
});
UInt64 limit_for_merging = (need_finish_sorting ? 0 : limit);
pipeline.firstStream() = std::make_shared<MergingSortedBlockInputStream>(
pipeline.streams, order_descr,
settings.max_block_size, limit);
pipeline.streams, sorting_info->prefix_order_descr,
settings.max_block_size, limit_for_merging);
pipeline.streams.resize(1);
}
if (need_finish_sorting)
{
pipeline.firstStream() = std::make_shared<FinishSortingBlockInputStream>(
pipeline.firstStream(), sorting_info->prefix_order_descr,
order_descr, settings.max_block_size, limit);
}
}
else
{
View File
@ -248,7 +248,7 @@ private:
Context context;
NamesAndTypesList source_columns;
SyntaxAnalyzerResultPtr syntax_analyzer_result;
std::unique_ptr<ExpressionAnalyzer> query_analyzer;
std::unique_ptr<SelectQueryExpressionAnalyzer> query_analyzer;
SelectQueryInfo query_info;
/// How many streams we ask for storage to produce, and in how many threads we will do further processing.
View File
@ -16,6 +16,7 @@
#include <Interpreters/QueryThreadLog.h>
#include <Interpreters/TraceLog.h>
#include <Interpreters/TextLog.h>
#include <Interpreters/MetricLog.h>
#include <Databases/IDatabase.h>
#include <Storages/StorageDistributed.h>
#include <Storages/StorageReplicatedMergeTree.h>
@ -232,7 +233,8 @@ BlockIO InterpreterSystemQuery::execute()
[&] () { if (auto part_log = context.getPartLog("")) part_log->flush(); },
[&] () { if (auto query_thread_log = context.getQueryThreadLog()) query_thread_log->flush(); },
[&] () { if (auto trace_log = context.getTraceLog()) trace_log->flush(); },
[&] () { if (auto text_log = context.getTextLog()) text_log->flush(); }
[&] () { if (auto text_log = context.getTextLog()) text_log->flush(); },
[&] () { if (auto metric_log = context.getMetricLog()) metric_log->flush(); }
);
break;
case Type::STOP_LISTEN_QUERIES:
View File
@ -0,0 +1,133 @@
#include <Interpreters/MetricLog.h>
#include <DataTypes/DataTypesNumber.h>
#include <DataTypes/DataTypeDate.h>
#include <DataTypes/DataTypeDateTime.h>
namespace DB
{
Block MetricLogElement::createBlock()
{
ColumnsWithTypeAndName columns_with_type_and_name;
columns_with_type_and_name.emplace_back(std::make_shared<DataTypeDate>(), "event_date");
columns_with_type_and_name.emplace_back(std::make_shared<DataTypeDateTime>(), "event_time");
columns_with_type_and_name.emplace_back(std::make_shared<DataTypeUInt64>(), "milliseconds");
for (size_t i = 0, end = ProfileEvents::end(); i < end; ++i)
{
std::string name;
name += "ProfileEvent_";
name += ProfileEvents::getName(ProfileEvents::Event(i));
columns_with_type_and_name.emplace_back(std::make_shared<DataTypeUInt64>(), std::move(name));
}
for (size_t i = 0, end = CurrentMetrics::end(); i < end; ++i)
{
std::string name;
name += "CurrentMetric_";
name += CurrentMetrics::getName(CurrentMetrics::Metric(i));
columns_with_type_and_name.emplace_back(std::make_shared<DataTypeInt64>(), std::move(name));
}
return Block(columns_with_type_and_name);
}
void MetricLogElement::appendToBlock(Block & block) const
{
MutableColumns columns = block.mutateColumns();
size_t column_idx = 0;
columns[column_idx++]->insert(DateLUT::instance().toDayNum(event_time));
columns[column_idx++]->insert(event_time);
columns[column_idx++]->insert(milliseconds);
for (size_t i = 0, end = ProfileEvents::end(); i < end; ++i)
columns[column_idx++]->insert(profile_events[i]);
for (size_t i = 0, end = CurrentMetrics::end(); i < end; ++i)
columns[column_idx++]->insert(current_metrics[i]);
}
void MetricLog::startCollectMetric(size_t collect_interval_milliseconds_)
{
collect_interval_milliseconds = collect_interval_milliseconds_;
is_shutdown_metric_thread = false;
metric_flush_thread = ThreadFromGlobalPool([this] { metricThreadFunction(); });
}
void MetricLog::stopCollectMetric()
{
bool old_val = false;
if (!is_shutdown_metric_thread.compare_exchange_strong(old_val, true))
return;
metric_flush_thread.join();
}
inline UInt64 time_in_milliseconds(std::chrono::time_point<std::chrono::system_clock> timepoint)
{
return std::chrono::duration_cast<std::chrono::milliseconds>(timepoint.time_since_epoch()).count();
}
inline UInt64 time_in_seconds(std::chrono::time_point<std::chrono::system_clock> timepoint)
{
return std::chrono::duration_cast<std::chrono::seconds>(timepoint.time_since_epoch()).count();
}
void MetricLog::metricThreadFunction()
{
auto desired_timepoint = std::chrono::system_clock::now();
/// For differentiation of ProfileEvents counters.
std::vector<ProfileEvents::Count> prev_profile_events(ProfileEvents::end());
while (!is_shutdown_metric_thread)
{
try
{
const auto current_time = std::chrono::system_clock::now();
MetricLogElement elem;
elem.event_time = std::chrono::system_clock::to_time_t(current_time);
elem.milliseconds = time_in_milliseconds(current_time) - time_in_seconds(current_time) * 1000;
elem.profile_events.resize(ProfileEvents::end());
for (size_t i = 0, end = ProfileEvents::end(); i < end; ++i)
{
const ProfileEvents::Count new_value = ProfileEvents::global_counters[i].load(std::memory_order_relaxed);
UInt64 & old_value = prev_profile_events[i];
elem.profile_events[i] = new_value - old_value;
old_value = new_value;
}
elem.current_metrics.resize(CurrentMetrics::end());
for (size_t i = 0, end = CurrentMetrics::end(); i < end; ++i)
{
elem.current_metrics[i] = CurrentMetrics::values[i];
}
this->add(elem);
/// We will record the current time into the table, but align it to regular time intervals to avoid time drift.
/// We may drop some time points if the server is overloaded and recording took too much time.
while (desired_timepoint <= current_time)
desired_timepoint += std::chrono::milliseconds(collect_interval_milliseconds);
std::this_thread::sleep_until(desired_timepoint);
}
catch (...)
{
tryLogCurrentException(__PRETTY_FUNCTION__);
}
}
}
}
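A self-contained sketch (not from the patch) of the two ideas in metricThreadFunction: cumulative ProfileEvents counters are differentiated into per-interval deltas, and wake-ups are aligned to a fixed grid so that collection times do not drift:
#include <chrono>
#include <iostream>
#include <thread>
#include <vector>
int main()
{
    using namespace std::chrono;
    const milliseconds interval(100);
    auto desired = system_clock::now();
    std::vector<long> prev(4, 0);
    for (int iteration = 0; iteration < 3; ++iteration)
    {
        const auto now = system_clock::now();
        /// Stand-in for ProfileEvents::global_counters: cumulative values.
        std::vector<long> counters{10L * (iteration + 1), 0, 5, 7};
        for (size_t i = 0; i < counters.size(); ++i)
        {
            long delta = counters[i] - prev[i];  /// what gets logged
            prev[i] = counters[i];
            std::cout << "event " << i << " += " << delta << '\n';
        }
        /// Align the next wake-up to the grid; skip points if we fell behind.
        while (desired <= now)
            desired += interval;
        std::this_thread::sleep_until(desired);
    }
}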
View File
@ -0,0 +1,51 @@
#pragma once
#include <Interpreters/SystemLog.h>
#include <Common/ProfileEvents.h>
#include <Common/CurrentMetrics.h>
#include <vector>
#include <atomic>
#include <ctime>
namespace DB
{
/** MetricLog is a log of metric values measured at a regular time interval.
*/
struct MetricLogElement
{
time_t event_time{};
UInt64 milliseconds{};
std::vector<ProfileEvents::Count> profile_events;
std::vector<CurrentMetrics::Metric> current_metrics;
static std::string name() { return "MetricLog"; }
static Block createBlock();
void appendToBlock(Block & block) const;
};
class MetricLog : public SystemLog<MetricLogElement>
{
using SystemLog<MetricLogElement>::SystemLog;
public:
/// Launches a background thread that collects metrics at the given interval.
void startCollectMetric(size_t collect_interval_milliseconds_);
/// Stop background thread. Call before shutdown.
void stopCollectMetric();
private:
void metricThreadFunction();
ThreadFromGlobalPool metric_flush_thread;
size_t collect_interval_milliseconds;
std::atomic<bool> is_shutdown_metric_thread{false};
};
}
View File
@ -166,6 +166,7 @@ void MutationsInterpreter::prepare(bool dry_run)
throw Exception("Empty mutation commands list", ErrorCodes::LOGICAL_ERROR);
const ColumnsDescription & columns_desc = storage->getColumns();
const IndicesDescription & indices_desc = storage->getIndices();
NamesAndTypesList all_columns = columns_desc.getAllPhysical();
NameSet updated_columns;
@ -175,9 +176,10 @@ void MutationsInterpreter::prepare(bool dry_run)
updated_columns.insert(kv.first);
}
/// We need to know which columns affect which MATERIALIZED columns to recalculate them if dependencies
/// are updated.
/// We need to know which columns affect which MATERIALIZED columns and data skipping indices
/// to recalculate them if dependencies are updated.
std::unordered_map<String, Names> column_to_affected_materialized;
NameSet affected_indices_columns;
if (!updated_columns.empty())
{
for (const auto & column : columns_desc)
@ -193,24 +195,40 @@ void MutationsInterpreter::prepare(bool dry_run)
}
}
}
for (const auto & index : indices_desc.indices)
{
auto query = index->expr->clone();
auto syntax_result = SyntaxAnalyzer(context).analyze(query, all_columns);
const auto required_columns = syntax_result->requiredSourceColumns();
for (const String & dependency : required_columns)
{
if (updated_columns.count(dependency))
{
affected_indices_columns.insert(std::cbegin(required_columns), std::cend(required_columns));
break;
}
}
}
validateUpdateColumns(storage, updated_columns, column_to_affected_materialized);
}
/// First, break a sequence of commands into stages.
stages.emplace_back(context);
for (const auto & command : commands)
{
if (!stages.back().column_to_updated.empty())
stages.emplace_back(context);
if (command.type == MutationCommand::DELETE)
{
if (stages.empty() || !stages.back().column_to_updated.empty())
stages.emplace_back(context);
auto negated_predicate = makeASTFunction("not", command.predicate->clone());
stages.back().filters.push_back(negated_predicate);
}
else if (command.type == MutationCommand::UPDATE)
{
if (stages.empty() || !stages.back().column_to_updated.empty())
stages.emplace_back(context);
if (stages.size() == 1) /// First stage only supports filtering and can't update columns.
stages.emplace_back(context);
@ -251,35 +269,84 @@ void MutationsInterpreter::prepare(bool dry_run)
}
}
}
else if (command.type == MutationCommand::MATERIALIZE_INDEX)
{
auto it = std::find_if(
std::cbegin(indices_desc.indices), std::end(indices_desc.indices),
[&](const std::shared_ptr<ASTIndexDeclaration> & index)
{
return index->name == command.index_name;
});
if (it == std::cend(indices_desc.indices))
throw Exception("Unknown index: " + command.index_name, ErrorCodes::BAD_ARGUMENTS);
auto query = (*it)->expr->clone();
auto syntax_result = SyntaxAnalyzer(context).analyze(query, all_columns);
const auto required_columns = syntax_result->requiredSourceColumns();
affected_indices_columns.insert(std::cbegin(required_columns), std::cend(required_columns));
}
else
throw Exception("Unknown mutation command type: " + DB::toString<int>(command.type), ErrorCodes::UNKNOWN_MUTATION_COMMAND);
}
/// Next, for each stage calculate columns changed by this and previous stages.
for (size_t i = 0; i < stages.size(); ++i)
if (!affected_indices_columns.empty())
{
if (!stages[i].filters.empty())
if (!stages.empty())
{
std::vector<Stage> stages_copy;
/// Copy all filled stages except the index calculation stage.
for (const auto & stage : stages)
{
stages_copy.emplace_back(context);
stages_copy.back().column_to_updated = stage.column_to_updated;
stages_copy.back().output_columns = stage.output_columns;
stages_copy.back().filters = stage.filters;
}
auto first_stage_header = prepareInterpreterSelect(stages_copy, /* dry_run = */ true)->getSampleBlock();
auto in = std::make_shared<NullBlockInputStream>(first_stage_header);
updated_header = std::make_unique<Block>(addStreamsForLaterStages(stages_copy, in)->getHeader());
}
/// Special step to recalculate affected indices.
stages.emplace_back(context);
for (const auto & column : affected_indices_columns)
stages.back().column_to_updated.emplace(
column, std::make_shared<ASTIdentifier>(column));
}
interpreter_select = prepareInterpreterSelect(stages, dry_run);
is_prepared = true;
}
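A self-contained sketch (not from the patch) of the stage-splitting rule above: a DELETE becomes a negated filter, an UPDATE opens a new stage whenever the current one already updates columns, and stage 0 may only filter; the conditional update expression is shown schematically:
#include <iostream>
#include <map>
#include <string>
#include <vector>
struct Stage
{
    std::vector<std::string> filters;
    std::map<std::string, std::string> column_to_updated;
};
int main()
{
    std::vector<Stage> stages;
    /// ALTER TABLE t DELETE WHERE x = 0
    if (stages.empty() || !stages.back().column_to_updated.empty())
        stages.emplace_back();
    stages.back().filters.push_back("not(x = 0)");
    /// ALTER TABLE t UPDATE y = y + 1 WHERE x > 1
    if (stages.empty() || !stages.back().column_to_updated.empty())
        stages.emplace_back();
    if (stages.size() == 1)  /// the first stage only filters, it cannot update
        stages.emplace_back();
    stages.back().column_to_updated["y"] = "if(x > 1, y + 1, y)";
    std::cout << "stages: " << stages.size() << '\n';  /// prints 2
}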
std::unique_ptr<InterpreterSelectQuery> MutationsInterpreter::prepareInterpreterSelect(std::vector<Stage> & prepared_stages, bool dry_run)
{
NamesAndTypesList all_columns = storage->getColumns().getAllPhysical();
/// Next, for each stage calculate columns changed by this and previous stages.
for (size_t i = 0; i < prepared_stages.size(); ++i)
{
if (!prepared_stages[i].filters.empty())
{
for (const auto & column : all_columns)
stages[i].output_columns.insert(column.name);
prepared_stages[i].output_columns.insert(column.name);
continue;
}
if (i > 0)
stages[i].output_columns = stages[i - 1].output_columns;
prepared_stages[i].output_columns = prepared_stages[i - 1].output_columns;
if (stages[i].output_columns.size() < all_columns.size())
if (prepared_stages[i].output_columns.size() < all_columns.size())
{
for (const auto & kv : stages[i].column_to_updated)
stages[i].output_columns.insert(kv.first);
for (const auto & kv : prepared_stages[i].column_to_updated)
prepared_stages[i].output_columns.insert(kv.first);
}
}
/// Now, calculate `expressions_chain` for each stage except the first.
/// Do it backwards to propagate information about columns required as input for a stage to the previous stage.
for (size_t i = stages.size() - 1; i > 0; --i)
for (size_t i = prepared_stages.size() - 1; i > 0; --i)
{
auto & stage = stages[i];
auto & stage = prepared_stages[i];
ASTPtr all_asts = std::make_shared<ASTExpressionList>();
@ -317,7 +384,7 @@ void MutationsInterpreter::prepare(bool dry_run)
for (const auto & kv : stage.column_to_updated)
{
actions_chain.getLastActions()->add(ExpressionAction::copyColumn(
kv.second->getColumnName(), kv.first, /* can_replace = */ true));
kv.second->getColumnName(), kv.first, /* can_replace = */ true));
}
}
@ -329,7 +396,7 @@ void MutationsInterpreter::prepare(bool dry_run)
/// Propagate information about columns needed as input.
for (const auto & column : actions_chain.steps.front().actions->getRequiredColumnsWithTypes())
stages[i - 1].output_columns.insert(column.name);
prepared_stages[i - 1].output_columns.insert(column.name);
}
/// Execute first stage as a SELECT statement.
@ -337,36 +404,34 @@ void MutationsInterpreter::prepare(bool dry_run)
auto select = std::make_shared<ASTSelectQuery>();
select->setExpression(ASTSelectQuery::Expression::SELECT, std::make_shared<ASTExpressionList>());
for (const auto & column_name : stages[0].output_columns)
for (const auto & column_name : prepared_stages[0].output_columns)
select->select()->children.push_back(std::make_shared<ASTIdentifier>(column_name));
if (!stages[0].filters.empty())
if (!prepared_stages[0].filters.empty())
{
ASTPtr where_expression;
if (stages[0].filters.size() == 1)
where_expression = stages[0].filters[0];
if (prepared_stages[0].filters.size() == 1)
where_expression = prepared_stages[0].filters[0];
else
{
auto coalesced_predicates = std::make_shared<ASTFunction>();
coalesced_predicates->name = "and";
coalesced_predicates->arguments = std::make_shared<ASTExpressionList>();
coalesced_predicates->children.push_back(coalesced_predicates->arguments);
coalesced_predicates->arguments->children = stages[0].filters;
coalesced_predicates->arguments->children = prepared_stages[0].filters;
where_expression = std::move(coalesced_predicates);
}
select->setExpression(ASTSelectQuery::Expression::WHERE, std::move(where_expression));
}
interpreter_select = std::make_unique<InterpreterSelectQuery>(select, context, storage, SelectQueryOptions().analyze(dry_run).ignoreLimits());
is_prepared = true;
return std::make_unique<InterpreterSelectQuery>(select, context, storage, SelectQueryOptions().analyze(dry_run).ignoreLimits());
}
BlockInputStreamPtr MutationsInterpreter::addStreamsForLaterStages(BlockInputStreamPtr in) const
BlockInputStreamPtr MutationsInterpreter::addStreamsForLaterStages(const std::vector<Stage> & prepared_stages, BlockInputStreamPtr in) const
{
for (size_t i_stage = 1; i_stage < stages.size(); ++i_stage)
for (size_t i_stage = 1; i_stage < prepared_stages.size(); ++i_stage)
{
const Stage & stage = stages[i_stage];
const Stage & stage = prepared_stages[i_stage];
for (size_t i = 0; i < stage.expressions_chain.steps.size(); ++i)
{
@ -398,14 +463,22 @@ void MutationsInterpreter::validate()
prepare(/* dry_run = */ true);
Block first_stage_header = interpreter_select->getSampleBlock();
BlockInputStreamPtr in = std::make_shared<NullBlockInputStream>(first_stage_header);
addStreamsForLaterStages(in)->getHeader();
addStreamsForLaterStages(stages, in)->getHeader();
}
BlockInputStreamPtr MutationsInterpreter::execute()
{
prepare(/* dry_run = */ false);
BlockInputStreamPtr in = interpreter_select->execute().in;
return addStreamsForLaterStages(in);
auto result_stream = addStreamsForLaterStages(stages, in);
if (!updated_header)
updated_header = std::make_unique<Block>(result_stream->getHeader());
return result_stream;
}
const Block & MutationsInterpreter::getUpdatedHeader() const
{
return *updated_header;
}
}
View File
@ -13,7 +13,7 @@ namespace DB
class Context;
/// Create an input stream that will read data from storage and apply mutation commands (UPDATEs, DELETEs)
/// Create an input stream that will read data from storage and apply mutation commands (UPDATEs, DELETEs, MATERIALIZEs)
/// to this data.
class MutationsInterpreter
{
@ -30,13 +30,19 @@ public:
/// Return false if the data isn't going to be changed by mutations.
bool isStorageTouchedByMutations() const;
/// The resulting stream will return blocks containing changed columns only.
/// The resulting stream will return blocks containing only the changed columns and the columns needed to recalculate indices.
BlockInputStreamPtr execute();
/// Only changed columns.
const Block & getUpdatedHeader() const;
private:
void prepare(bool dry_run);
BlockInputStreamPtr addStreamsForLaterStages(BlockInputStreamPtr in) const;
struct Stage;
std::unique_ptr<InterpreterSelectQuery> prepareInterpreterSelect(std::vector<Stage> & prepared_stages, bool dry_run);
BlockInputStreamPtr addStreamsForLaterStages(const std::vector<Stage> & prepared_stages, BlockInputStreamPtr in) const;
private:
StoragePtr storage;
@ -78,6 +84,7 @@ private:
};
std::unique_ptr<InterpreterSelectQuery> interpreter_select;
std::unique_ptr<Block> updated_header;
std::vector<Stage> stages;
bool is_prepared = false; /// Has the sequence of stages been prepared.
};
View File
@ -1,7 +1,6 @@
#pragma once
#include "DatabaseAndTableWithAlias.h"
#include "ExpressionAnalyzer.h"
#include <Parsers/ASTSelectQuery.h>
#include <map>
View File
@ -12,7 +12,6 @@ class Join;
using JoinPtr = std::shared_ptr<Join>;
class InterpreterSelectWithUnionQuery;
struct AnalyzedJoin;
/// Information on what to do when executing a subquery in the [GLOBAL] IN/JOIN section.
View File
@ -1,7 +1,9 @@
#include <Core/Settings.h>
#include <Core/NamesAndTypes.h>
#include <Interpreters/SyntaxAnalyzer.h>
#include <Interpreters/InJoinSubqueriesPreprocessor.h>
#include <Interpreters/LogicalExpressionsOptimizer.h>
#include <Core/Settings.h>
#include <Interpreters/QueryAliasesVisitor.h>
#include <Interpreters/InterpreterSelectWithUnionQuery.h>
#include <Interpreters/ArrayJoinedColumnsVisitor.h>
@ -14,6 +16,8 @@
#include <Interpreters/ExternalDictionaries.h>
#include <Interpreters/OptimizeIfWithConstantConditionVisitor.h>
#include <Interpreters/RequiredSourceColumnsVisitor.h>
#include <Interpreters/GetAggregatesVisitor.h>
#include <Interpreters/ExpressionActions.h> /// getSmallestColumn()
#include <Parsers/ASTExpressionList.h>
#include <Parsers/ASTFunction.h>
@ -27,10 +31,8 @@
#include <DataTypes/NestedUtils.h>
#include <Core/NamesAndTypes.h>
#include <IO/WriteHelpers.h>
#include <Storages/IStorage.h>
#include <Common/typeid_cast.h>
#include <functional>
@ -46,6 +48,7 @@ namespace ErrorCodes
extern const int EMPTY_LIST_OF_COLUMNS_QUERIED;
extern const int NOT_IMPLEMENTED;
extern const int UNKNOWN_IDENTIFIER;
extern const int EXPECTED_ALL_OR_ANY;
}
NameSet removeDuplicateColumns(NamesAndTypesList & columns)
@ -485,6 +488,27 @@ void getArrayJoinedColumns(ASTPtr & query, SyntaxAnalyzerResult & result, const
}
}
void setJoinStrictness(ASTSelectQuery & select_query, JoinStrictness join_default_strictness)
{
const ASTTablesInSelectQueryElement * node = select_query.join();
if (!node)
return;
auto & table_join = const_cast<ASTTablesInSelectQueryElement *>(node)->table_join->as<ASTTableJoin &>();
if (table_join.strictness == ASTTableJoin::Strictness::Unspecified &&
table_join.kind != ASTTableJoin::Kind::Cross)
{
if (join_default_strictness == JoinStrictness::ANY)
table_join.strictness = ASTTableJoin::Strictness::Any;
else if (join_default_strictness == JoinStrictness::ALL)
table_join.strictness = ASTTableJoin::Strictness::All;
else
throw Exception("Expected ANY or ALL in JOIN section, because setting (join_default_strictness) is empty",
DB::ErrorCodes::EXPECTED_ALL_OR_ANY);
}
}
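A self-contained sketch (not from the patch) of the defaulting rule implemented above; the real function also leaves CROSS joins untouched:
#include <iostream>
#include <stdexcept>
#include <string>
enum class Strictness { Unspecified, Any, All };
Strictness applyDefaultStrictness(Strictness in_query, const std::string & join_default_strictness)
{
    if (in_query != Strictness::Unspecified)
        return in_query;  /// an explicit ANY/ALL in the query always wins
    if (join_default_strictness == "ANY")
        return Strictness::Any;
    if (join_default_strictness == "ALL")
        return Strictness::All;
    throw std::runtime_error("Expected ANY or ALL in JOIN section (join_default_strictness is empty)");
}
int main()
{
    /// SELECT ... FROM t1 JOIN t2 USING k with join_default_strictness = 'ALL' behaves as ALL JOIN.
    std::cout << int(applyDefaultStrictness(Strictness::Unspecified, "ALL")) << '\n';
}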
/// Find the columns that are obtained by JOIN.
void collectJoinedColumns(AnalyzedJoin & analyzed_join, const ASTSelectQuery & select_query, const NameSet & source_columns,
const Aliases & aliases, bool join_use_nulls)
@ -558,6 +582,30 @@ void checkJoin(const ASTTablesInSelectQueryElement * join)
ErrorCodes::NOT_IMPLEMENTED);
}
std::vector<const ASTFunction *> getAggregates(const ASTPtr & query)
{
if (const auto * select_query = query->as<ASTSelectQuery>())
{
/// There cannot be aggregate functions inside WHERE or PREWHERE.
if (select_query->where())
assertNoAggregates(select_query->where(), "in WHERE");
if (select_query->prewhere())
assertNoAggregates(select_query->prewhere(), "in PREWHERE");
GetAggregatesVisitor::Data data;
GetAggregatesVisitor(data).visit(query);
/// There cannot be other aggregate functions nested inside aggregate functions.
for (const ASTFunction * node : data.aggregates)
for (auto & arg : node->arguments->children)
assertNoAggregates(arg, "inside another aggregate function");
return data.aggregates;
}
else
assertNoAggregates(query, "in wrong place");
return {};
}
}
/// Calculate which columns are required to execute the expression.
@ -837,9 +885,11 @@ SyntaxAnalyzerResultPtr SyntaxAnalyzer::analyze(
/// Push the predicate expression down to the subqueries.
result.rewrite_subqueries = PredicateExpressionsOptimizer(select_query, settings, context).optimize();
setJoinStrictness(*select_query, settings.join_default_strictness);
collectJoinedColumns(result.analyzed_join, *select_query, source_columns_set, result.aliases, settings.join_use_nulls);
}
result.aggregates = getAggregates(query);
result.collectUsedColumns(query, additional_source_columns);
return std::make_shared<const SyntaxAnalyzerResult>(result);
}
View File
@ -10,6 +10,8 @@ namespace DB
NameSet removeDuplicateColumns(NamesAndTypesList & columns);
class ASTFunction;
struct SyntaxAnalyzerResult
{
StoragePtr storage;
@ -22,6 +24,7 @@ struct SyntaxAnalyzerResult
NamesAndTypesList columns_added_by_join;
Aliases aliases;
std::vector<const ASTFunction *> aggregates;
/// Which column is needed to be ARRAY-JOIN'ed to get the specified.
/// For example, for `SELECT s.v ... ARRAY JOIN a AS s` will get "s.v" -> "a.v".
View File
@ -4,6 +4,7 @@
#include <Interpreters/PartLog.h>
#include <Interpreters/TextLog.h>
#include <Interpreters/TraceLog.h>
#include <Interpreters/MetricLog.h>
#include <Poco/Util/AbstractConfiguration.h>
@ -48,6 +49,13 @@ SystemLogs::SystemLogs(Context & global_context, const Poco::Util::AbstractConfi
part_log = createSystemLog<PartLog>(global_context, "system", "part_log", config, "part_log");
trace_log = createSystemLog<TraceLog>(global_context, "system", "trace_log", config, "trace_log");
text_log = createSystemLog<TextLog>(global_context, "system", "text_log", config, "text_log");
metric_log = createSystemLog<MetricLog>(global_context, "system", "metric_log", config, "metric_log");
if (metric_log)
{
size_t collect_interval_milliseconds = config.getUInt64("metric_log.collect_interval_milliseconds");
metric_log->startCollectMetric(collect_interval_milliseconds);
}
part_log_database = config.getString("part_log.database", "system");
}
@ -70,6 +78,11 @@ void SystemLogs::shutdown()
trace_log->shutdown();
if (text_log)
text_log->shutdown();
if (metric_log)
{
metric_log->stopCollectMetric();
metric_log->shutdown();
}
}
}
View File
@ -61,6 +61,7 @@ class QueryThreadLog;
class PartLog;
class TextLog;
class TraceLog;
class MetricLog;
/// System logs should be destroyed in destructor of the last Context and before tables,
/// because SystemLog destruction makes insert query while flushing data into underlying tables
@ -76,6 +77,7 @@ struct SystemLogs
std::shared_ptr<PartLog> part_log; /// Used to log operations with parts
std::shared_ptr<TraceLog> trace_log; /// Used to log traces from query profiler
std::shared_ptr<TextLog> text_log; /// Used to log all text messages.
std::shared_ptr<MetricLog> metric_log; /// Used to log all metrics.
String part_log_database;
};
View File
@ -278,12 +278,14 @@ User::User(const String & name_, const String & config_elem, const Poco::Util::A
{
bool has_password = config.has(config_elem + ".password");
bool has_password_sha256_hex = config.has(config_elem + ".password_sha256_hex");
bool has_password_double_sha1_hex = config.has(config_elem + ".password_double_sha1_hex");
if (has_password && has_password_sha256_hex)
throw Exception("Both fields 'password' and 'password_sha256_hex' are specified for user " + name + ". Must be only one of them.", ErrorCodes::BAD_ARGUMENTS);
if (has_password + has_password_sha256_hex + has_password_double_sha1_hex > 1)
throw Exception("More than one field of 'password', 'password_sha256_hex', 'password_double_sha1_hex' is used to specify password for user " + name + ". Must be only one of them.",
ErrorCodes::BAD_ARGUMENTS);
if (!has_password && !has_password_sha256_hex)
throw Exception("Either 'password' or 'password_sha256_hex' must be specified for user " + name + ".", ErrorCodes::BAD_ARGUMENTS);
if (!has_password && !has_password_sha256_hex && !has_password_double_sha1_hex)
throw Exception("Either 'password' or 'password_sha256_hex' or 'password_double_sha1_hex' must be specified for user " + name + ".", ErrorCodes::BAD_ARGUMENTS);
if (has_password)
password = config.getString(config_elem + ".password");
@ -296,6 +298,14 @@ User::User(const String & name_, const String & config_elem, const Poco::Util::A
throw Exception("password_sha256_hex for user " + name + " has length " + toString(password_sha256_hex.size()) + " but must be exactly 64 symbols.", ErrorCodes::BAD_ARGUMENTS);
}
if (has_password_double_sha1_hex)
{
password_double_sha1_hex = Poco::toLower(config.getString(config_elem + ".password_double_sha1_hex"));
if (password_double_sha1_hex.size() != 40)
throw Exception("password_double_sha1_hex for user " + name + " has length " + toString(password_double_sha1_hex.size()) + " but must be exactly 40 symbols.", ErrorCodes::BAD_ARGUMENTS);
}
profile = config.getString(config_elem + ".profile");
quota = config.getString(config_elem + ".quota");
View File
@ -56,6 +56,7 @@ struct User
/// Required password. Could be stored in plaintext, as a SHA256 hash, or as a double SHA1 hash.
String password;
String password_sha256_hex;
String password_double_sha1_hex;
String profile;
String quota;
View File
@ -1,14 +1,15 @@
#include <Interpreters/UsersManager.h>
#include <Poco/Net/IPAddress.h>
#include <Poco/Util/AbstractConfiguration.h>
#include <Poco/String.h>
#include "config_core.h"
#include <Common/Exception.h>
#include <common/logger_useful.h>
#include <IO/HexWriteBuffer.h>
#include <IO/WriteBufferFromString.h>
#include <IO/WriteHelpers.h>
#include <common/logger_useful.h>
#include "config_core.h"
#include <Poco/Net/IPAddress.h>
#include <Poco/SHA1Engine.h>
#include <Poco/String.h>
#include <Poco/Util/AbstractConfiguration.h>
#if USE_SSL
# include <openssl/sha.h>
#endif
@ -93,6 +94,21 @@ UserPtr UsersManager::authorizeAndGetUser(
throw DB::Exception("SHA256 passwords support is disabled, because ClickHouse was built without SSL library", DB::ErrorCodes::SUPPORT_IS_DISABLED);
#endif
}
else if (!it->second->password_double_sha1_hex.empty())
{
Poco::SHA1Engine engine;
engine.update(password);
const auto & first_sha1 = engine.digest();
/// If the request came via the MySQL compatibility server, the client sends SHA1(password), so first_sha1 here is already the double SHA1.
if (Poco::SHA1Engine::digestToHex(first_sha1) == it->second->password_double_sha1_hex)
return it->second;
engine.update(first_sha1.data(), first_sha1.size());
if (Poco::SHA1Engine::digestToHex(engine.digest()) != it->second->password_double_sha1_hex)
on_wrong_password();
}
else if (password != it->second->password)
{
on_wrong_password();
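Since double SHA1 is the scheme of MySQL's mysql_native_password, the value for the users config can be produced with a few lines of Poco; a self-contained sketch (not from the patch), stored value = hex(SHA1(SHA1(password))):
#include <Poco/SHA1Engine.h>
#include <iostream>
#include <string>
static std::string doubleSha1Hex(const std::string & password)
{
    Poco::SHA1Engine engine;
    engine.update(password);
    const auto first = engine.digest();  /// digest() returns SHA1(password) and resets the engine
    engine.update(first.data(), first.size());
    return Poco::DigestEngine::digestToHex(engine.digest());
}
int main()
{
    /// Paste the output into password_double_sha1_hex in users.xml.
    std::cout << doubleSha1Hex("default") << '\n';
}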
View File
@ -56,7 +56,7 @@ target_link_libraries (expression_analyzer PRIVATE dbms clickhouse_storages_syst
add_check(expression_analyzer)
add_executable (users users.cpp)
target_link_libraries (users PRIVATE dbms clickhouse_common_config ${Boost_FILESYSTEM_LIBRARY})
target_link_libraries (users PRIVATE dbms clickhouse_common_config stdc++fs)
if (OS_LINUX)
add_executable (internal_iotop internal_iotop.cpp)
View File
@ -56,7 +56,7 @@ int main(int argc, char ** argv)
};
auto syntax_result = SyntaxAnalyzer(context, {}).analyze(ast, columns);
ExpressionAnalyzer analyzer(ast, syntax_result, context);
SelectQueryExpressionAnalyzer analyzer(ast, syntax_result, context);
ExpressionActionsChain chain(context);
analyzer.appendSelect(chain, false);
analyzer.appendProjectResult(chain);
View File
@ -114,8 +114,24 @@ void ASTAlterCommand::formatImpl(
else if (type == ASTAlterCommand::DROP_INDEX)
{
settings.ostr << (settings.hilite ? hilite_keyword : "") << indent_str
<< "DROP INDEX " << (if_exists ? "IF EXISTS " : "") << (settings.hilite ? hilite_none : "");
<< (clear_index ? "CLEAR " : "DROP ") << "INDEX " << (if_exists ? "IF EXISTS " : "") << (settings.hilite ? hilite_none : "");
index->formatImpl(settings, state, frame);
if (partition)
{
settings.ostr << (settings.hilite ? hilite_keyword : "") << indent_str << " IN PARTITION " << (settings.hilite ? hilite_none : "");
partition->formatImpl(settings, state, frame);
}
}
else if (type == ASTAlterCommand::MATERIALIZE_INDEX)
{
settings.ostr << (settings.hilite ? hilite_keyword : "") << indent_str
<< "MATERIALIZE INDEX " << (settings.hilite ? hilite_none : "");
index->formatImpl(settings, state, frame);
if (partition)
{
settings.ostr << (settings.hilite ? hilite_keyword : "") << indent_str << " IN PARTITION " << (settings.hilite ? hilite_none : "");
partition->formatImpl(settings, state, frame);
}
}
else if (type == ASTAlterCommand::DROP_PARTITION)
{
View File
@ -32,6 +32,7 @@ public:
ADD_INDEX,
DROP_INDEX,
MATERIALIZE_INDEX,
DROP_PARTITION,
ATTACH_PARTITION,
@ -69,6 +70,8 @@ public:
/** The ADD INDEX query stores the name of the index following AFTER.
* The DROP INDEX query stores the name for deletion.
* The MATERIALIZE INDEX query stores the name of the index to materialize.
* The CLEAR INDEX query stores the name of the index to clear.
*/
ASTPtr index;
@ -98,9 +101,11 @@ public:
bool clear_column = false; /// for CLEAR COLUMN (do not drop column from metadata)
bool if_not_exists = false; /// option for ADD_COLUMN
bool clear_index = false; /// for CLEAR INDEX (do not drop index from metadata)
bool if_exists = false; /// option for DROP_COLUMN, MODIFY_COLUMN, COMMENT_COLUMN
bool if_not_exists = false; /// option for ADD_COLUMN
bool if_exists = false; /// option for DROP_COLUMN, MODIFY_COLUMN, COMMENT_COLUMN
/** For FETCH PARTITION - the path in ZK to the shard, from which to download the partition.
*/
View File
@ -12,7 +12,7 @@ class ASTPartition : public IAST
{
public:
ASTPtr value;
StringRef fields_str; /// The extent of comma-separated partition expression fields without parentheses.
String fields_str; /// The extent of comma-separated partition expression fields without parentheses.
size_t fields_count = 0;
String id;
View File
@ -33,6 +33,8 @@ bool ParserAlterCommand::parseImpl(Pos & pos, ASTPtr & node, Expected & expected
ParserKeyword s_add_index("ADD INDEX");
ParserKeyword s_drop_index("DROP INDEX");
ParserKeyword s_clear_index("CLEAR INDEX");
ParserKeyword s_materialize_index("MATERIALIZE INDEX");
ParserKeyword s_attach_partition("ATTACH PARTITION");
ParserKeyword s_detach_partition("DETACH PARTITION");
@ -101,6 +103,24 @@ bool ParserAlterCommand::parseImpl(Pos & pos, ASTPtr & node, Expected & expected
command->type = ASTAlterCommand::DROP_COLUMN;
command->detach = false;
}
else if (s_clear_column.ignore(pos, expected))
{
if (s_if_exists.ignore(pos, expected))
command->if_exists = true;
if (!parser_name.parse(pos, command->column, expected))
return false;
command->type = ASTAlterCommand::DROP_COLUMN;
command->clear_column = true;
command->detach = false;
if (s_in_partition.ignore(pos, expected))
{
if (!parser_partition.parse(pos, command->partition, expected))
return false;
}
}
else if (s_add_index.ignore(pos, expected))
{
if (s_if_not_exists.ignore(pos, expected))
@ -128,16 +148,32 @@ bool ParserAlterCommand::parseImpl(Pos & pos, ASTPtr & node, Expected & expected
command->type = ASTAlterCommand::DROP_INDEX;
command->detach = false;
}
else if (s_clear_column.ignore(pos, expected))
else if (s_clear_index.ignore(pos, expected))
{
if (s_if_exists.ignore(pos, expected))
command->if_exists = true;
if (!parser_name.parse(pos, command->column, expected))
if (!parser_name.parse(pos, command->index, expected))
return false;
command->type = ASTAlterCommand::DROP_COLUMN;
command->clear_column = true;
command->type = ASTAlterCommand::DROP_INDEX;
command->clear_index = true;
command->detach = false;
if (!s_in_partition.ignore(pos, expected))
return false;
if (!parser_partition.parse(pos, command->partition, expected))
return false;
}
else if (s_materialize_index.ignore(pos, expected))
{
if (s_if_exists.ignore(pos, expected))
command->if_exists = true;
if (!parser_name.parse(pos, command->index, expected))
return false;
command->type = ASTAlterCommand::MATERIALIZE_INDEX;
command->detach = false;
if (s_in_partition.ignore(pos, expected))
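A hedged driver (not from the patch) exercising the ALTER forms this parser now accepts; it assumes the parseQuery helper from Parsers/parseQuery.h (max_query_size = 0 means no limit):
#include <Parsers/ParserAlterQuery.h>
#include <Parsers/parseQuery.h>
#include <string>
void parseNewAlterForms()
{
    DB::ParserAlterQuery parser;
    for (const char * query : {
             "ALTER TABLE t CLEAR COLUMN c IN PARTITION 201908",
             "ALTER TABLE t CLEAR INDEX idx IN PARTITION 201908",       /// IN PARTITION is mandatory here
             "ALTER TABLE t MATERIALIZE INDEX idx",                     /// IN PARTITION is optional here
             "ALTER TABLE t MATERIALIZE INDEX idx IN PARTITION 201908"})
    {
        DB::ASTPtr ast = DB::parseQuery(parser, query, "example", 0);
    }
}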
View File
@ -35,7 +35,7 @@ bool ParserPartition::parseImpl(Pos & pos, ASTPtr & node, Expected & expected)
return false;
size_t fields_count;
StringRef fields_str;
String fields_str;
const auto * tuple_ast = value->as<ASTFunction>();
if (tuple_ast && tuple_ast->name == "tuple")
@ -59,17 +59,17 @@ bool ParserPartition::parseImpl(Pos & pos, ASTPtr & node, Expected & expected)
if (right_paren->type != TokenType::ClosingRoundBracket)
return false;
fields_str = StringRef(left_paren->end, right_paren->begin - left_paren->end);
fields_str = String(left_paren->end, right_paren->begin - left_paren->end);
}
else
{
fields_count = 1;
fields_str = StringRef(begin->begin, pos->begin - begin->begin);
fields_str = String(begin->begin, pos->begin - begin->begin);
}
partition->value = value;
partition->children.push_back(value);
partition->fields_str = fields_str;
partition->fields_str = std::move(fields_str);
partition->fields_count = fields_count;
}
View File
@ -177,7 +177,7 @@ private:
/// Prepare processor with pid number.
/// Check parents and children of current processor and push them to stacks if they also need to be prepared.
/// If processor wants to be expanded, ExpandPipelineTask from thread_number's execution context will be used.
bool prepareProcessor(size_t pid, Stack & children, Stack & parents, size_t thread_number, bool async);
bool prepareProcessor(UInt64 pid, Stack & children, Stack & parents, size_t thread_number, bool async);
void doExpandPipeline(ExpandPipelineTask * task, bool processing);
void executeImpl(size_t num_threads);
View File
@ -1,14 +1,13 @@
#include "config_formats.h"
#include <Processors/Formats/Impl/CapnProtoRowInputFormat.h> // Y_IGNORE
#include "CapnProtoRowInputFormat.h"
#if USE_CAPNP
#include <IO/ReadBuffer.h>
#include <Interpreters/Context.h>
#include <Formats/FormatFactory.h>
#include <Formats/FormatSchemaInfo.h>
#include <capnp/serialize.h> // Y_IGNORE
#include <capnp/dynamic.h> // Y_IGNORE
#include <capnp/common.h> // Y_IGNORE
#include <capnp/serialize.h>
#include <capnp/dynamic.h>
#include <capnp/common.h>
#include <boost/algorithm/string.hpp>
#include <boost/range/join.hpp>
#include <common/logger_useful.h>
View File
@ -1,10 +1,10 @@
#pragma once
#include <Common/config.h>
#include "config_formats.h"
#if USE_CAPNP
#include <Core/Block.h>
#include <Processors/Formats/IRowInputFormat.h>
#include <capnp/schema-parser.h>
namespace DB
View File
@ -1,7 +1,6 @@
#include "config_formats.h"
#include <Processors/Formats/Impl/ParquetBlockInputFormat.h>
#include "ParquetBlockInputFormat.h"
#if USE_PARQUET
#include <algorithm>
#include <iterator>
#include <vector>
View File
@ -1,5 +1,4 @@
#include "config_formats.h"
#include <Processors/Formats/Impl/ParquetBlockOutputFormat.h>
#include "ParquetBlockOutputFormat.h"
#if USE_PARQUET
View File
@ -1,5 +1,4 @@
#include "config_formats.h"
#include <Processors/Formats/Impl/ProtobufRowInputFormat.h>
#include "ProtobufRowInputFormat.h"
#if USE_PROTOBUF
#include <Core/Block.h>
View File
@ -1,6 +1,6 @@
#pragma once
#include <Common/config.h>
#include "config_formats.h"
#if USE_PROTOBUF
#include <DataTypes/IDataType.h>
View File
@ -1,10 +1,8 @@
#include <Formats/FormatFactory.h>
#include "ProtobufRowOutputFormat.h"
#include "config_formats.h"
#if USE_PROTOBUF
#include <Processors/Formats/Impl/ProtobufRowOutputFormat.h>
#include <Core/Block.h>
#include <Formats/FormatSchemaInfo.h>
#include <Formats/ProtobufSchemas.h>
View File
@ -1,6 +1,6 @@
#pragma once
#include <Common/config.h>
#include "config_formats.h"
#if USE_PROTOBUF
#include <Core/Block.h>
View File
@ -155,10 +155,10 @@ std::optional<AlterCommand> AlterCommand::parse(const ASTAlterCommand * command_
return command;
}
else if (command_ast->type == ASTAlterCommand::DROP_INDEX)
else if (command_ast->type == ASTAlterCommand::DROP_INDEX && !command_ast->partition)
{
if (command_ast->clear_column)
throw Exception("\"ALTER TABLE table CLEAR COLUMN column\" queries are not supported yet. Use \"CLEAR COLUMN column IN PARTITION\".", ErrorCodes::NOT_IMPLEMENTED);
throw Exception("\"ALTER TABLE table CLEAR INDEX index\" queries are not supported yet. Use \"CLEAR INDEX index IN PARTITION\".", ErrorCodes::NOT_IMPLEMENTED);
AlterCommand command;
command.type = AlterCommand::DROP_INDEX;
View File
@ -34,11 +34,22 @@ IStorage::IStorage(ColumnsDescription columns_, ColumnsDescription virtuals_) :
setColumns(std::move(columns_));
}
IStorage::IStorage(ColumnsDescription columns_, ColumnsDescription virtuals_, IndicesDescription indices_) : virtuals(std::move(virtuals_))
{
setColumns(std::move(columns_));
setIndices(std::move(indices_));
}
const ColumnsDescription & IStorage::getColumns() const
{
return columns;
}
const ColumnsDescription & IStorage::getVirtuals() const
{
return virtuals;
}
const IndicesDescription & IStorage::getIndices() const
{
return indices;
View File
@ -66,6 +66,7 @@ public:
IStorage() = default;
explicit IStorage(ColumnsDescription columns_);
IStorage(ColumnsDescription columns_, ColumnsDescription virtuals_);
IStorage(ColumnsDescription columns_, ColumnsDescription virtuals_, IndicesDescription indices_);
virtual ~IStorage() = default;
IStorage(const IStorage &) = delete;
@ -106,6 +107,7 @@ public:
public: /// thread-unsafe part. lockStructure must be acquired
const ColumnsDescription & getColumns() const; /// returns combined set of columns
const ColumnsDescription & getVirtuals() const;
const IndicesDescription & getIndices() const;
/// NOTE: these methods should include virtual columns,
View File
@ -8,6 +8,16 @@
namespace DB
{
bool IndicesDescription::has(const String & name) const
{
return std::cend(indices) != std::find_if(
std::cbegin(indices), std::cend(indices),
[&name](const auto & index)
{
return index->name == name;
});
}
String IndicesDescription::toString() const
{
if (indices.empty())
View File
@ -15,8 +15,9 @@ struct IndicesDescription
IndicesDescription() = default;
bool empty() const { return indices.empty(); }
String toString() const;
bool has(const String & name) const;
String toString() const;
static IndicesDescription parse(const String & str);
};
View File
@ -12,18 +12,22 @@ namespace ErrorCodes
namespace
{
constexpr auto DATA_FILE_EXTENSION = ".bin";
constexpr auto INDEX_FILE_EXTENSION = ".idx";
}
IMergedBlockOutputStream::IMergedBlockOutputStream(
MergeTreeData & storage_,
const String & part_path_,
size_t min_compress_block_size_,
size_t max_compress_block_size_,
CompressionCodecPtr codec_,
size_t aio_threshold_,
bool blocks_are_granules_size_,
const std::vector<MergeTreeIndexPtr> & indices_to_recalc,
const MergeTreeIndexGranularity & index_granularity_)
: storage(storage_)
, part_path(part_path_)
, min_compress_block_size(min_compress_block_size_)
, max_compress_block_size(max_compress_block_size_)
, aio_threshold(aio_threshold_)
@ -32,6 +36,7 @@ IMergedBlockOutputStream::IMergedBlockOutputStream(
, index_granularity(index_granularity_)
, compute_granularity(index_granularity.empty())
, codec(std::move(codec_))
, skip_indices(indices_to_recalc)
, with_final_mark(storage.getCOWSettings()->write_final_mark && storage.canUseAdaptiveGranularity())
{
if (blocks_are_granules_size && !index_granularity.empty())
@ -305,6 +310,106 @@ void IMergedBlockOutputStream::writeFinalMark(
}, path);
}
void IMergedBlockOutputStream::initSkipIndices()
{
for (const auto & index : skip_indices)
{
String stream_name = index->getFileName();
skip_indices_streams.emplace_back(
std::make_unique<ColumnStream>(
stream_name,
part_path + stream_name, INDEX_FILE_EXTENSION,
part_path + stream_name, marks_file_extension,
codec, max_compress_block_size,
0, aio_threshold));
skip_indices_aggregators.push_back(index->createIndexAggregator());
skip_index_filling.push_back(0);
}
}
void IMergedBlockOutputStream::calculateAndSerializeSkipIndices(
const ColumnsWithTypeAndName & skip_indexes_columns, size_t rows)
{
/// Creating block for update
Block indices_update_block(skip_indexes_columns);
size_t skip_index_current_mark = 0;
/// Filling and writing skip indices like in IMergedBlockOutputStream::writeColumn
for (size_t i = 0; i < storage.skip_indices.size(); ++i)
{
const auto index = storage.skip_indices[i];
auto & stream = *skip_indices_streams[i];
size_t prev_pos = 0;
skip_index_current_mark = skip_index_mark;
while (prev_pos < rows)
{
UInt64 limit = 0;
if (prev_pos == 0 && index_offset != 0)
{
limit = index_offset;
}
else
{
limit = index_granularity.getMarkRows(skip_index_current_mark);
if (skip_indices_aggregators[i]->empty())
{
skip_indices_aggregators[i] = index->createIndexAggregator();
skip_index_filling[i] = 0;
if (stream.compressed.offset() >= min_compress_block_size)
stream.compressed.next();
writeIntBinary(stream.plain_hashing.count(), stream.marks);
writeIntBinary(stream.compressed.offset(), stream.marks);
/// Actually these numbers are redundant, but we have to store them
/// to be compatible with the normal .mrk2 file format.
if (storage.canUseAdaptiveGranularity())
writeIntBinary(1UL, stream.marks);
++skip_index_current_mark;
}
}
size_t pos = prev_pos;
skip_indices_aggregators[i]->update(indices_update_block, &pos, limit);
if (pos == prev_pos + limit)
{
++skip_index_filling[i];
/// Write the index granule once it is filled.
if (skip_index_filling[i] == index->granularity)
{
skip_indices_aggregators[i]->getGranuleAndReset()->serializeBinary(stream.compressed);
skip_index_filling[i] = 0;
}
}
prev_pos = pos;
}
}
skip_index_mark = skip_index_current_mark;
}
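Each time the loop above opens a new granule, it appends one mark to the marks file: the offset in the compressed file, the offset inside the decompressed block, and, with adaptive granularity, a rows count pinned to 1 for .mrk2 compatibility. A rough standalone sketch of that record; the struct and its field names are ours, the real code writes the fields directly with writeIntBinary():

#include <cstdint>
#include <ostream>

// Hypothetical layout of one skip-index mark, mirroring the three
// writeIntBinary() calls above.
struct SkipIndexMark
{
    uint64_t offset_in_compressed_file;    // stream.plain_hashing.count()
    uint64_t offset_in_decompressed_block; // stream.compressed.offset()
    uint64_t rows_in_granule = 1;          // redundant, kept for .mrk2 compatibility
};

void writeMark(std::ostream & marks, const SkipIndexMark & mark, bool adaptive_granularity)
{
    marks.write(reinterpret_cast<const char *>(&mark.offset_in_compressed_file), sizeof(uint64_t));
    marks.write(reinterpret_cast<const char *>(&mark.offset_in_decompressed_block), sizeof(uint64_t));
    if (adaptive_granularity) // only .mrk2 stores the row count
        marks.write(reinterpret_cast<const char *>(&mark.rows_in_granule), sizeof(uint64_t));
}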
void IMergedBlockOutputStream::finishSkipIndicesSerialization(
MergeTreeData::DataPart::Checksums & checksums)
{
for (size_t i = 0; i < skip_indices.size(); ++i)
{
auto & stream = *skip_indices_streams[i];
if (!skip_indices_aggregators[i]->empty())
skip_indices_aggregators[i]->getGranuleAndReset()->serializeBinary(stream.compressed);
}
for (auto & stream : skip_indices_streams)
{
stream->finalize();
stream->addToChecksums(checksums);
}
skip_indices_streams.clear();
skip_indices_aggregators.clear();
skip_index_filling.clear();
}
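Taken together, the three helpers form a small protocol for derived writers: open the streams once, feed the skip-index columns of every block, then flush and checksum. A sketch of that call order; SketchedWriter and its blocks argument are stand-ins that assume ClickHouse's headers, only the three protected helpers come from this file:

#include <vector>
#include <Storages/MergeTree/IMergedBlockOutputStream.h>

// Sketch only: assumes each block already contains just the skip-index
// columns, as the real writers arrange before calling these helpers.
class SketchedWriter : public DB::IMergedBlockOutputStream
{
public:
    using DB::IMergedBlockOutputStream::IMergedBlockOutputStream;

    void writeSkipIndices(const std::vector<DB::Block> & blocks,
                          DB::MergeTreeData::DataPart::Checksums & checksums)
    {
        initSkipIndices();                         // one stream + aggregator per index
        for (const auto & block : blocks)
            calculateAndSerializeSkipIndices(block.getColumnsWithTypeAndName(), block.rows());
        finishSkipIndicesSerialization(checksums); // flush partial granules, record checksums
    }
};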
/// Implementation of IMergedBlockOutputStream::ColumnStream.

View File

@ -16,11 +16,13 @@ class IMergedBlockOutputStream : public IBlockOutputStream
public:
IMergedBlockOutputStream(
MergeTreeData & storage_,
const String & part_path_,
size_t min_compress_block_size_,
size_t max_compress_block_size_,
CompressionCodecPtr default_codec_,
size_t aio_threshold_,
bool blocks_are_granules_size_,
const std::vector<MergeTreeIndexPtr> & indices_to_recalc,
const MergeTreeIndexGranularity & index_granularity_);
using WrittenOffsetColumns = std::set<std::string>;
@ -117,10 +119,15 @@ protected:
bool skip_offsets,
DB::IDataType::SubstreamPath & path);
void initSkipIndices();
void calculateAndSerializeSkipIndices(const ColumnsWithTypeAndName & skip_indexes_columns, size_t rows);
void finishSkipIndicesSerialization(MergeTreeData::DataPart::Checksums & checksums);
protected:
MergeTreeData & storage;
SerializationStates serialization_states;
String part_path;
ColumnStreams column_streams;
/// The offset to the first row of the block for which you want to write the index.
@ -132,6 +139,7 @@ protected:
size_t aio_threshold;
size_t current_mark = 0;
size_t skip_index_mark = 0;
const std::string marks_file_extension;
const bool blocks_are_granules_size;
@ -141,6 +149,11 @@ protected:
const bool compute_granularity;
CompressionCodecPtr codec;
std::vector<MergeTreeIndexPtr> skip_indices;
std::vector<std::unique_ptr<ColumnStream>> skip_indices_streams;
MergeTreeIndexAggregators skip_indices_aggregators;
std::vector<size_t> skip_index_filling;
const bool with_final_mark;
};

View File

@ -1594,6 +1594,7 @@ void MergeTreeData::alterDataPart(
true /* sync */,
compression_codec,
true /* skip_offsets */,
{},
unused_written_offsets,
part->index_granularity);
@ -2568,7 +2569,7 @@ String MergeTreeData::getPartitionIDFromQuery(const ASTPtr & ast, const Context
if (fields_count)
{
ReadBufferFromMemory left_paren_buf("(", 1);
ReadBufferFromMemory fields_buf(partition_ast.fields_str.data, partition_ast.fields_str.size);
ReadBufferFromMemory fields_buf(partition_ast.fields_str.data(), partition_ast.fields_str.size());
ReadBufferFromMemory right_paren_buf(")", 1);
ConcatReadBuffer buf({&left_paren_buf, &fields_buf, &right_paren_buf});
@ -2577,7 +2578,7 @@ String MergeTreeData::getPartitionIDFromQuery(const ASTPtr & ast, const Context
auto block = input_stream->read();
if (!block || !block.rows())
throw Exception(
"Could not parse partition value: `" + partition_ast.fields_str.toString() + "`",
"Could not parse partition value: `" + partition_ast.fields_str + "`",
ErrorCodes::INVALID_PARTITION_VALUE);
for (size_t i = 0; i < fields_count; ++i)

View File

@ -823,6 +823,7 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mergePartsToTempor
false,
compression_codec,
false,
{},
written_offset_columns,
to.getIndexGranularity()
);
@ -902,7 +903,6 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mutatePartToTempor
"This is a bug.", ErrorCodes::LOGICAL_ERROR);
CurrentMetrics::Increment num_mutations{CurrentMetrics::PartMutation};
const auto & source_part = future_part.parts[0];
auto storage_from_source_part = StorageFromMergeTreeDataPart::create(source_part);
@ -910,7 +910,19 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mutatePartToTempor
context_for_reading.getSettingsRef().merge_tree_uniform_read_distribution = 0;
context_for_reading.getSettingsRef().max_threads = 1;
MutationsInterpreter mutations_interpreter(storage_from_source_part, commands, context_for_reading);
std::vector<MutationCommand> commands_for_part;
std::copy_if(
std::cbegin(commands), std::cend(commands),
std::back_inserter(commands_for_part),
[&] (const MutationCommand & command)
{
return command.partition == nullptr ||
future_part.parts[0]->info.partition_id == data.getPartitionIDFromQuery(
command.partition, context_for_reading);
});
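The copy_if above narrows the mutation to commands that either carry no PARTITION clause or target this part's partition id. The same predicate in a self-contained form, with a simplified stand-in for MutationCommand:

#include <algorithm>
#include <iterator>
#include <optional>
#include <string>
#include <vector>

// Simplified stand-in: nullopt means the command applies to every partition.
struct Command
{
    std::optional<std::string> partition_id;
};

std::vector<Command> commandsForPart(const std::vector<Command> & commands,
                                     const std::string & part_partition_id)
{
    std::vector<Command> result;
    std::copy_if(std::cbegin(commands), std::cend(commands), std::back_inserter(result),
                 [&](const Command & cmd)
                 {
                     return !cmd.partition_id || *cmd.partition_id == part_partition_id;
                 });
    return result;
}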
MutationsInterpreter mutations_interpreter(storage_from_source_part, commands_for_part, context_for_reading);
if (!mutations_interpreter.isStorageTouchedByMutations())
{
@ -940,6 +952,8 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mutatePartToTempor
Poco::File(new_part_tmp_path).createDirectories();
auto in = mutations_interpreter.execute();
const auto & updated_header = mutations_interpreter.getUpdatedHeader();
NamesAndTypesList all_columns = data.getColumns().getAllPhysical();
const auto data_settings = data.getCOWSettings();
@ -949,7 +963,7 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mutatePartToTempor
MergeStageProgress stage_progress(1.0);
in->setProgressCallback(MergeProgressCallback(merge_entry, watch_prev_elapsed, stage_progress));
if (in_header.columns() == all_columns.size())
if (updated_header.columns() == all_columns.size())
{
/// All columns are modified, proceed to write a new part from scratch.
if (data.hasPrimaryKey() || data.hasSkipIndices())
@ -984,21 +998,39 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mutatePartToTempor
/// We will modify only some of the columns. Other columns and key values can be copied as-is.
/// TODO: check that we modify only non-key columns in this case.
/// Checks if columns used in skipping indexes modified/
/// Check whether any columns used by skipping indexes were modified.
std::set<MergeTreeIndexPtr> indices_to_recalc;
ASTPtr indices_recalc_expr_list = std::make_shared<ASTExpressionList>();
for (const auto & col : in_header.getNames())
{
for (const auto & index : data.skip_indices)
for (size_t i = 0; i < data.skip_indices.size(); ++i)
{
const auto & index = data.skip_indices[i];
const auto & index_cols = index->expr->getRequiredColumns();
auto it = find(cbegin(index_cols), cend(index_cols), col);
if (it != cend(index_cols))
throw Exception("You can not modify columns used in index. Index name: '"
+ index->name
+ "' bad column: '" + *it + "'", ErrorCodes::ILLEGAL_COLUMN);
if (it != cend(index_cols) && indices_to_recalc.insert(index).second)
{
ASTPtr expr_list = MergeTreeData::extractKeyExpressionList(
storage_from_source_part->getIndices().indices[i]->expr->clone());
for (const auto & expr : expr_list->children)
indices_recalc_expr_list->children.push_back(expr->clone());
}
}
}
if (!indices_to_recalc.empty())
{
auto indices_recalc_syntax = SyntaxAnalyzer(context, {}).analyze(
indices_recalc_expr_list, in_header.getNamesAndTypesList());
auto indices_recalc_expr = ExpressionAnalyzer(
indices_recalc_expr_list,
indices_recalc_syntax, context).getActions(false);
in = std::make_shared<MaterializingBlockInputStream>(
std::make_shared<ExpressionBlockInputStream>(in, indices_recalc_expr));
}
NameSet files_to_skip = {"checksums.txt", "columns.txt"};
auto mrk_extension = data_settings->index_granularity_bytes ? getAdaptiveMrkExtension() : getNonAdaptiveMrkExtension();
for (const auto & entry : in_header)
{
@ -1012,6 +1044,11 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mutatePartToTempor
IDataType::SubstreamPath stream_path;
entry.type->enumerateStreams(callback, stream_path);
}
for (const auto & index : indices_to_recalc)
{
files_to_skip.insert(index->getFileName() + ".idx");
files_to_skip.insert(index->getFileName() + ".mrk");
}
Poco::DirectoryIterator dir_end;
for (Poco::DirectoryIterator dir_it(source_part->getFullPath()); dir_it != dir_end; ++dir_it)
@ -1025,16 +1062,17 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mutatePartToTempor
createHardLink(dir_it.path().toString(), destination.toString());
}
merge_entry->columns_written = all_columns.size() - in_header.columns();
merge_entry->columns_written = all_columns.size() - updated_header.columns();
IMergedBlockOutputStream::WrittenOffsetColumns unused_written_offsets;
MergedColumnOnlyOutputStream out(
data,
in_header,
updated_header,
new_part_tmp_path,
/* sync = */ false,
compression_codec,
/* skip_offsets = */ false,
std::vector<MergeTreeIndexPtr>(indices_to_recalc.begin(), indices_to_recalc.end()),
unused_written_offsets,
source_part->index_granularity
);
@ -1068,7 +1106,7 @@ MergeTreeData::MutableDataPartPtr MergeTreeDataMergerMutator::mutatePartToTempor
NameSet source_columns_name_set(source_column_names.begin(), source_column_names.end());
for (auto it = new_data_part->columns.begin(); it != new_data_part->columns.end();)
{
if (source_columns_name_set.count(it->name) || in_header.has(it->name))
if (source_columns_name_set.count(it->name) || updated_header.has(it->name))
++it;
else
it = new_data_part->columns.erase(it);

View File

@ -409,6 +409,8 @@ void MergeTreeDataPart::remove() const
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
#endif
std::shared_lock<std::shared_mutex> lock(columns_lock);
for (const auto & [file, _] : checksums.files)
{
String path_to_remove = to + "/" + file;

Some files were not shown because too many files have changed in this diff.