Merge branch 'master' of github.com:yandex/ClickHouse

Author: BayoNet
Date: 2019-03-06 14:13:29 +03:00
Commit: 1cc87a7e36
96 changed files with 23737 additions and 971 deletions

View File

@ -13,6 +13,9 @@ list(APPEND dirs ${dirs1})
get_property (dirs1 TARGET cityhash PROPERTY INCLUDE_DIRECTORIES)
list(APPEND dirs ${dirs1})
get_property (dirs1 TARGET roaring PROPERTY INCLUDE_DIRECTORIES)
list(APPEND dirs ${dirs1})
if (USE_INTERNAL_BOOST_LIBRARY)
get_property (dirs1 TARGET ${Boost_PROGRAM_OPTIONS_LIBRARY} PROPERTY INCLUDE_DIRECTORIES)
list(APPEND dirs ${dirs1})

View File

@ -46,6 +46,7 @@ if (USE_INTERNAL_METROHASH_LIBRARY)
endif ()
add_subdirectory (murmurhash)
add_subdirectory (croaring)
if (USE_INTERNAL_BTRIE_LIBRARY)
add_subdirectory (libbtrie)

View File

@ -198,7 +198,7 @@ list(APPEND PARQUET_SRCS
add_library(${PARQUET_LIBRARY} ${LINK_MODE} ${PARQUET_SRCS})
target_include_directories(${PARQUET_LIBRARY} SYSTEM PUBLIC ${ClickHouse_SOURCE_DIR}/contrib/arrow/cpp/src ${CMAKE_CURRENT_SOURCE_DIR}/cpp/src)
include(${ClickHouse_SOURCE_DIR}/contrib/thrift/build/cmake/ConfigureChecks.cmake) # makes config.h
target_link_libraries(${PARQUET_LIBRARY} PRIVATE ${ARROW_LIBRARY} ${THRIFT_LIBRARY} ${Boost_REGEX_LIBRARY})
target_link_libraries(${PARQUET_LIBRARY} PUBLIC ${ARROW_LIBRARY} PRIVATE ${THRIFT_LIBRARY} ${Boost_REGEX_LIBRARY})
target_include_directories(${PARQUET_LIBRARY} PRIVATE ${Boost_INCLUDE_DIRS})
if(SANITIZE STREQUAL "undefined")

View File

@ -0,0 +1,6 @@
add_library(roaring
roaring.c
roaring.h
roaring.hh)
target_include_directories (roaring PUBLIC ${CMAKE_CURRENT_SOURCE_DIR})

contrib/croaring/LICENSE (new file, 202 lines)
View File

@ -0,0 +1,202 @@
Apache License
Version 2.0, January 2004
http://www.apache.org/licenses/
TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
1. Definitions.
"License" shall mean the terms and conditions for use, reproduction,
and distribution as defined by Sections 1 through 9 of this document.
"Licensor" shall mean the copyright owner or entity authorized by
the copyright owner that is granting the License.
"Legal Entity" shall mean the union of the acting entity and all
other entities that control, are controlled by, or are under common
control with that entity. For the purposes of this definition,
"control" means (i) the power, direct or indirect, to cause the
direction or management of such entity, whether by contract or
otherwise, or (ii) ownership of fifty percent (50%) or more of the
outstanding shares, or (iii) beneficial ownership of such entity.
"You" (or "Your") shall mean an individual or Legal Entity
exercising permissions granted by this License.
"Source" form shall mean the preferred form for making modifications,
including but not limited to software source code, documentation
source, and configuration files.
"Object" form shall mean any form resulting from mechanical
transformation or translation of a Source form, including but
not limited to compiled object code, generated documentation,
and conversions to other media types.
"Work" shall mean the work of authorship, whether in Source or
Object form, made available under the License, as indicated by a
copyright notice that is included in or attached to the work
(an example is provided in the Appendix below).
"Derivative Works" shall mean any work, whether in Source or Object
form, that is based on (or derived from) the Work and for which the
editorial revisions, annotations, elaborations, or other modifications
represent, as a whole, an original work of authorship. For the purposes
of this License, Derivative Works shall not include works that remain
separable from, or merely link (or bind by name) to the interfaces of,
the Work and Derivative Works thereof.
"Contribution" shall mean any work of authorship, including
the original version of the Work and any modifications or additions
to that Work or Derivative Works thereof, that is intentionally
submitted to Licensor for inclusion in the Work by the copyright owner
or by an individual or Legal Entity authorized to submit on behalf of
the copyright owner. For the purposes of this definition, "submitted"
means any form of electronic, verbal, or written communication sent
to the Licensor or its representatives, including but not limited to
communication on electronic mailing lists, source code control systems,
and issue tracking systems that are managed by, or on behalf of, the
Licensor for the purpose of discussing and improving the Work, but
excluding communication that is conspicuously marked or otherwise
designated in writing by the copyright owner as "Not a Contribution."
"Contributor" shall mean Licensor and any individual or Legal Entity
on behalf of whom a Contribution has been received by Licensor and
subsequently incorporated within the Work.
2. Grant of Copyright License. Subject to the terms and conditions of
this License, each Contributor hereby grants to You a perpetual,
worldwide, non-exclusive, no-charge, royalty-free, irrevocable
copyright license to reproduce, prepare Derivative Works of,
publicly display, publicly perform, sublicense, and distribute the
Work and such Derivative Works in Source or Object form.
3. Grant of Patent License. Subject to the terms and conditions of
this License, each Contributor hereby grants to You a perpetual,
worldwide, non-exclusive, no-charge, royalty-free, irrevocable
(except as stated in this section) patent license to make, have made,
use, offer to sell, sell, import, and otherwise transfer the Work,
where such license applies only to those patent claims licensable
by such Contributor that are necessarily infringed by their
Contribution(s) alone or by combination of their Contribution(s)
with the Work to which such Contribution(s) was submitted. If You
institute patent litigation against any entity (including a
cross-claim or counterclaim in a lawsuit) alleging that the Work
or a Contribution incorporated within the Work constitutes direct
or contributory patent infringement, then any patent licenses
granted to You under this License for that Work shall terminate
as of the date such litigation is filed.
4. Redistribution. You may reproduce and distribute copies of the
Work or Derivative Works thereof in any medium, with or without
modifications, and in Source or Object form, provided that You
meet the following conditions:
(a) You must give any other recipients of the Work or
Derivative Works a copy of this License; and
(b) You must cause any modified files to carry prominent notices
stating that You changed the files; and
(c) You must retain, in the Source form of any Derivative Works
that You distribute, all copyright, patent, trademark, and
attribution notices from the Source form of the Work,
excluding those notices that do not pertain to any part of
the Derivative Works; and
(d) If the Work includes a "NOTICE" text file as part of its
distribution, then any Derivative Works that You distribute must
include a readable copy of the attribution notices contained
within such NOTICE file, excluding those notices that do not
pertain to any part of the Derivative Works, in at least one
of the following places: within a NOTICE text file distributed
as part of the Derivative Works; within the Source form or
documentation, if provided along with the Derivative Works; or,
within a display generated by the Derivative Works, if and
wherever such third-party notices normally appear. The contents
of the NOTICE file are for informational purposes only and
do not modify the License. You may add Your own attribution
notices within Derivative Works that You distribute, alongside
or as an addendum to the NOTICE text from the Work, provided
that such additional attribution notices cannot be construed
as modifying the License.
You may add Your own copyright statement to Your modifications and
may provide additional or different license terms and conditions
for use, reproduction, or distribution of Your modifications, or
for any such Derivative Works as a whole, provided Your use,
reproduction, and distribution of the Work otherwise complies with
the conditions stated in this License.
5. Submission of Contributions. Unless You explicitly state otherwise,
any Contribution intentionally submitted for inclusion in the Work
by You to the Licensor shall be under the terms and conditions of
this License, without any additional terms or conditions.
Notwithstanding the above, nothing herein shall supersede or modify
the terms of any separate license agreement you may have executed
with Licensor regarding such Contributions.
6. Trademarks. This License does not grant permission to use the trade
names, trademarks, service marks, or product names of the Licensor,
except as required for reasonable and customary use in describing the
origin of the Work and reproducing the content of the NOTICE file.
7. Disclaimer of Warranty. Unless required by applicable law or
agreed to in writing, Licensor provides the Work (and each
Contributor provides its Contributions) on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
implied, including, without limitation, any warranties or conditions
of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
PARTICULAR PURPOSE. You are solely responsible for determining the
appropriateness of using or redistributing the Work and assume any
risks associated with Your exercise of permissions under this License.
8. Limitation of Liability. In no event and under no legal theory,
whether in tort (including negligence), contract, or otherwise,
unless required by applicable law (such as deliberate and grossly
negligent acts) or agreed to in writing, shall any Contributor be
liable to You for damages, including any direct, indirect, special,
incidental, or consequential damages of any character arising as a
result of this License or out of the use or inability to use the
Work (including but not limited to damages for loss of goodwill,
work stoppage, computer failure or malfunction, or any and all
other commercial damages or losses), even if such Contributor
has been advised of the possibility of such damages.
9. Accepting Warranty or Additional Liability. While redistributing
the Work or Derivative Works thereof, You may choose to offer,
and charge a fee for, acceptance of support, warranty, indemnity,
or other liability obligations and/or rights consistent with this
License. However, in accepting such obligations, You may act only
on Your own behalf and on Your sole responsibility, not on behalf
of any other Contributor, and only if You agree to indemnify,
defend, and hold each Contributor harmless for any liability
incurred by, or claims asserted against, such Contributor by reason
of your accepting any such warranty or additional liability.
END OF TERMS AND CONDITIONS
APPENDIX: How to apply the Apache License to your work.
To apply the Apache License to your work, attach the following
boilerplate notice, with the fields enclosed by brackets "{}"
replaced with your own identifying information. (Don't include
the brackets!) The text should be enclosed in the appropriate
comment syntax for the file format. We also recommend that a
file or class name and description of purpose be included on the
same "printed page" as the copyright notice for easier
identification within third-party archives.
Copyright 2016 The CRoaring authors
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.

View File

@ -0,0 +1,2 @@
Download from https://github.com/RoaringBitmap/CRoaring/archive/v0.2.57.tar.gz
and run ./amalgamation.sh to generate the amalgamated sources.

contrib/croaring/roaring.c (new file, 11093 lines)

File diff suppressed because it is too large.

contrib/croaring/roaring.h (new file, 7187 lines)

File diff suppressed because it is too large.

contrib/croaring/roaring.hh (new file, 1732 lines)

File diff suppressed because it is too large.

View File

@ -59,6 +59,12 @@ if (CMAKE_CXX_COMPILER_ID STREQUAL "Clang")
if (NOT CMAKE_CXX_COMPILER_VERSION VERSION_LESS 8)
set (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wextra-semi-stmt -Wshadow-field -Wstring-plus-int")
endif ()
if (NOT CMAKE_CXX_COMPILER_VERSION VERSION_LESS 9)
if (WEVERYTHING)
set (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wno-ctad-maybe-unsupported")
endif ()
endif ()
endif ()
if (USE_DEBUG_HELPERS)
@ -137,12 +143,10 @@ endif ()
add_subdirectory(src/Common/ZooKeeper)
add_subdirectory(src/Common/Config)
if (MAKE_STATIC_LIBRARIES)
if (MAKE_STATIC_LIBRARIES OR NOT SPLIT_SHARED_LIBRARIES)
add_library(dbms ${dbms_headers} ${dbms_sources})
else ()
add_library(dbms SHARED ${dbms_headers} ${dbms_sources})
set_target_properties (dbms PROPERTIES SOVERSION ${VERSION_MAJOR}.${VERSION_MINOR} VERSION ${VERSION_SO} OUTPUT_NAME clickhouse)
install (TARGETS dbms LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR} COMPONENT clickhouse)
endif ()
if (USE_EMBEDDED_COMPILER)
@ -201,9 +205,10 @@ target_link_libraries (clickhouse_common_io
Threads::Threads
PRIVATE
${CMAKE_DL_LIBS}
PUBLIC
roaring
)
target_include_directories(clickhouse_common_io SYSTEM BEFORE PUBLIC ${PDQSORT_INCLUDE_DIR})
target_include_directories(clickhouse_common_io SYSTEM BEFORE PUBLIC ${RE2_INCLUDE_DIR})
@ -235,6 +240,7 @@ target_link_libraries (dbms
Threads::Threads
)
target_include_directories(dbms SYSTEM BEFORE PUBLIC ${PDQSORT_INCLUDE_DIR})
if (NOT USE_INTERNAL_BOOST_LIBRARY)
target_include_directories (clickhouse_common_io SYSTEM BEFORE PUBLIC ${Boost_INCLUDE_DIRS})

View File

@ -7,7 +7,7 @@ option (ENABLE_CLICKHOUSE_SERVER "Enable clickhouse-server" ${ENABLE_CLICKHOUSE_
option (ENABLE_CLICKHOUSE_CLIENT "Enable clickhouse-client" ${ENABLE_CLICKHOUSE_ALL})
option (ENABLE_CLICKHOUSE_LOCAL "Enable clickhouse-local" ${ENABLE_CLICKHOUSE_ALL})
option (ENABLE_CLICKHOUSE_BENCHMARK "Enable clickhouse-benchmark" ${ENABLE_CLICKHOUSE_ALL})
option (ENABLE_CLICKHOUSE_PERFORMANCE "Enable clickhouse-performance-test" ${ENABLE_CLICKHOUSE_ALL})
option (ENABLE_CLICKHOUSE_PERFORMANCE_TEST "Enable clickhouse-performance-test" ${ENABLE_CLICKHOUSE_ALL})
option (ENABLE_CLICKHOUSE_EXTRACT_FROM_CONFIG "Enable clickhouse-extract-from-config" ${ENABLE_CLICKHOUSE_ALL})
option (ENABLE_CLICKHOUSE_COMPRESSOR "Enable clickhouse-compressor" ${ENABLE_CLICKHOUSE_ALL})
option (ENABLE_CLICKHOUSE_COPIER "Enable clickhouse-copier" ${ENABLE_CLICKHOUSE_ALL})
@ -15,8 +15,64 @@ option (ENABLE_CLICKHOUSE_FORMAT "Enable clickhouse-format" ${ENABLE_CLICKHOUSE_
option (ENABLE_CLICKHOUSE_OBFUSCATOR "Enable clickhouse-obfuscator" ${ENABLE_CLICKHOUSE_ALL})
option (ENABLE_CLICKHOUSE_ODBC_BRIDGE "Enable clickhouse-odbc-bridge" ${ENABLE_CLICKHOUSE_ALL})
if(NOT (MAKE_STATIC_LIBRARIES OR SPLIT_SHARED_LIBRARIES))
set(CLICKHOUSE_ONE_SHARED 1)
endif()
configure_file (config_tools.h.in ${CMAKE_CURRENT_BINARY_DIR}/config_tools.h)
macro(clickhouse_target_link_split_lib target name)
if(NOT CLICKHOUSE_ONE_SHARED)
target_link_libraries(${target} PRIVATE clickhouse-${name}-lib)
else()
target_link_libraries(${target} PRIVATE clickhouse-lib)
endif()
endmacro()
macro(clickhouse_program_link_split_binary name)
clickhouse_target_link_split_lib(clickhouse-${name} ${name})
endmacro()
macro(clickhouse_program_add_library name)
string(TOUPPER ${name} name_uc)
string(REPLACE "-" "_" name_uc ${name_uc})
# Some dark magic
set(CLICKHOUSE_${name_uc}_SOURCES ${CLICKHOUSE_${name_uc}_SOURCES} PARENT_SCOPE)
set(CLICKHOUSE_${name_uc}_LINK ${CLICKHOUSE_${name_uc}_LINK} PARENT_SCOPE)
set(CLICKHOUSE_${name_uc}_INCLUDE ${CLICKHOUSE_${name_uc}_INCLUDE} PARENT_SCOPE)
if(NOT CLICKHOUSE_ONE_SHARED)
add_library(clickhouse-${name}-lib ${LINK_MODE} ${CLICKHOUSE_${name_uc}_SOURCES})
set(_link ${CLICKHOUSE_${name_uc}_LINK}) # can't use ${} in if()
if(_link)
target_link_libraries(clickhouse-${name}-lib ${CLICKHOUSE_${name_uc}_LINK})
endif()
set(_include ${CLICKHOUSE_${name_uc}_INCLUDE}) # can't use ${} in if()
if (_include)
target_include_directories(clickhouse-${name}-lib ${CLICKHOUSE_${name_uc}_INCLUDE})
endif()
endif()
endmacro()
macro(clickhouse_program_add_executable name)
if(CLICKHOUSE_SPLIT_BINARY)
add_executable(clickhouse-${name} clickhouse-${name}.cpp)
clickhouse_program_link_split_binary(${name})
install(TARGETS clickhouse-${name} ${CLICKHOUSE_ALL_TARGETS} RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse)
endif()
endmacro()
macro(clickhouse_program_add name)
clickhouse_program_add_library(${name})
clickhouse_program_add_executable(${name})
endmacro()
add_subdirectory (server)
add_subdirectory (client)
add_subdirectory (local)
@ -33,6 +89,13 @@ if (ENABLE_CLICKHOUSE_ODBC_BRIDGE)
add_subdirectory (odbc-bridge)
endif ()
if (CLICKHOUSE_ONE_SHARED)
add_library(clickhouse-lib SHARED ${CLICKHOUSE_SERVER_SOURCES} ${CLICKHOUSE_CLIENT_SOURCES} ${CLICKHOUSE_LOCAL_SOURCES} ${CLICKHOUSE_BENCHMARK_SOURCES} ${CLICKHOUSE_PERFORMANCE_TEST_SOURCES} ${CLICKHOUSE_COPIER_SOURCES} ${CLICKHOUSE_EXTRACT_FROM_CONFIG_SOURCES} ${CLICKHOUSE_COMPRESSOR_SOURCES} ${CLICKHOUSE_FORMAT_SOURCES} ${CLICKHOUSE_OBFUSCATOR_SOURCES} ${CLICKHOUSE_COMPILER_SOURCES} ${CLICKHOUSE_ODBC_BRIDGE_SOURCES})
target_link_libraries(clickhouse-lib PUBLIC ${CLICKHOUSE_SERVER_LINK} ${CLICKHOUSE_CLIENT_LINK} ${CLICKHOUSE_LOCAL_LINK} ${CLICKHOUSE_BENCHMARK_LINK} ${CLICKHOUSE_PERFORMANCE_TEST_LINK} ${CLICKHOUSE_COPIER_LINK} ${CLICKHOUSE_EXTRACT_FROM_CONFIG_LINK} ${CLICKHOUSE_COMPRESSOR_LINK} ${CLICKHOUSE_FORMAT_LINK} ${CLICKHOUSE_OBFUSCATOR_LINK} ${CLICKHOUSE_COMPILER_LINK} ${CLICKHOUSE_ODBC_BRIDGE_LINK})
set_target_properties(clickhouse-lib PROPERTIES SOVERSION ${VERSION_MAJOR}.${VERSION_MINOR} VERSION ${VERSION_SO} OUTPUT_NAME clickhouse)
target_include_directories(clickhouse-lib ${CLICKHOUSE_SERVER_INCLUDE} ${CLICKHOUSE_CLIENT_INCLUDE} ${CLICKHOUSE_LOCAL_INCLUDE} ${CLICKHOUSE_BENCHMARK_INCLUDE} ${CLICKHOUSE_PERFORMANCE_TEST_INCLUDE} ${CLICKHOUSE_COPIER_INCLUDE} ${CLICKHOUSE_EXTRACT_FROM_CONFIG_INCLUDE} ${CLICKHOUSE_COMPRESSOR_INCLUDE} ${CLICKHOUSE_FORMAT_INCLUDE} ${CLICKHOUSE_OBFUSCATOR_INCLUDE} ${CLICKHOUSE_COMPILER_INCLUDE} ${CLICKHOUSE_ODBC_BRIDGE_INCLUDE})
endif()
if (CLICKHOUSE_SPLIT_BINARY)
set (CLICKHOUSE_ALL_TARGETS clickhouse-server clickhouse-client clickhouse-local clickhouse-benchmark clickhouse-performance-test
clickhouse-extract-from-config clickhouse-compressor clickhouse-format clickhouse-copier)
@ -71,7 +134,7 @@ else ()
if (ENABLE_CLICKHOUSE_BENCHMARK)
target_link_libraries (clickhouse PRIVATE clickhouse-benchmark-lib)
endif ()
if (ENABLE_CLICKHOUSE_PERFORMANCE)
if (ENABLE_CLICKHOUSE_PERFORMANCE_TEST)
target_link_libraries (clickhouse PRIVATE clickhouse-performance-test-lib)
endif ()
if (ENABLE_CLICKHOUSE_COPIER)
@ -114,7 +177,7 @@ else ()
install (FILES ${CMAKE_CURRENT_BINARY_DIR}/clickhouse-benchmark DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse)
list(APPEND CLICKHOUSE_BUNDLE clickhouse-benchmark)
endif ()
if (ENABLE_CLICKHOUSE_PERFORMANCE)
if (ENABLE_CLICKHOUSE_PERFORMANCE_TEST)
add_custom_target (clickhouse-performance-test ALL COMMAND ${CMAKE_COMMAND} -E create_symlink clickhouse clickhouse-performance-test DEPENDS clickhouse)
install (FILES ${CMAKE_CURRENT_BINARY_DIR}/clickhouse-performance-test DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse)
list(APPEND CLICKHOUSE_BUNDLE clickhouse-performance-test)

View File

@ -1,9 +1,9 @@
add_library (clickhouse-benchmark-lib ${LINK_MODE} Benchmark.cpp)
target_link_libraries (clickhouse-benchmark-lib PRIVATE clickhouse_aggregate_functions clickhouse-client-lib clickhouse_common_config clickhouse_common_io ${Boost_PROGRAM_OPTIONS_LIBRARY})
target_include_directories (clickhouse-benchmark-lib SYSTEM PRIVATE ${PCG_RANDOM_INCLUDE_DIR})
set(CLICKHOUSE_BENCHMARK_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/Benchmark.cpp)
set(CLICKHOUSE_BENCHMARK_LINK PRIVATE clickhouse_aggregate_functions clickhouse_common_config clickhouse_common_io ${Boost_PROGRAM_OPTIONS_LIBRARY})
set(CLICKHOUSE_BENCHMARK_INCLUDE SYSTEM PRIVATE ${PCG_RANDOM_INCLUDE_DIR})
if (CLICKHOUSE_SPLIT_BINARY)
add_executable (clickhouse-benchmark clickhouse-benchmark.cpp)
target_link_libraries (clickhouse-benchmark PRIVATE clickhouse-benchmark-lib clickhouse_aggregate_functions)
install (TARGETS clickhouse-benchmark ${CLICKHOUSE_ALL_TARGETS} RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse)
endif ()
clickhouse_program_add(benchmark)
if(NOT CLICKHOUSE_ONE_SHARED)
target_link_libraries (clickhouse-benchmark-lib PRIVATE clickhouse-client-lib)
endif()

View File

@ -1,13 +1,7 @@
add_library (clickhouse-client-lib ${LINK_MODE} Client.cpp)
target_link_libraries (clickhouse-client-lib PRIVATE clickhouse_common_config clickhouse_functions clickhouse_aggregate_functions clickhouse_common_io ${LINE_EDITING_LIBS} ${Boost_PROGRAM_OPTIONS_LIBRARY})
if (READLINE_INCLUDE_DIR)
target_include_directories (clickhouse-client-lib SYSTEM PRIVATE ${READLINE_INCLUDE_DIR})
endif ()
set(CLICKHOUSE_CLIENT_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/Client.cpp)
set(CLICKHOUSE_CLIENT_LINK PRIVATE clickhouse_common_config clickhouse_functions clickhouse_aggregate_functions clickhouse_common_io ${LINE_EDITING_LIBS} ${Boost_PROGRAM_OPTIONS_LIBRARY})
set(CLICKHOUSE_CLIENT_INCLUDE SYSTEM PRIVATE ${READLINE_INCLUDE_DIR})
if (CLICKHOUSE_SPLIT_BINARY)
add_executable (clickhouse-client clickhouse-client.cpp)
target_link_libraries (clickhouse-client PRIVATE clickhouse-client-lib)
install (TARGETS clickhouse-client ${CLICKHOUSE_ALL_TARGETS} RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse)
endif ()
clickhouse_program_add(client)
install (FILES clickhouse-client.xml DESTINATION ${CLICKHOUSE_ETC_DIR}/clickhouse-client COMPONENT clickhouse-client RENAME config.xml)

View File

@ -1,9 +1,7 @@
add_library (clickhouse-compressor-lib ${LINK_MODE} Compressor.cpp)
target_link_libraries (clickhouse-compressor-lib PRIVATE clickhouse_compression clickhouse_common_io ${Boost_PROGRAM_OPTIONS_LIBRARY})
# Also in utils
if (CLICKHOUSE_SPLIT_BINARY)
# Also in utils
add_executable (clickhouse-compressor clickhouse-compressor.cpp)
target_link_libraries (clickhouse-compressor PRIVATE clickhouse-compressor-lib)
install (TARGETS clickhouse-compressor ${CLICKHOUSE_ALL_TARGETS} RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse)
endif ()
set(CLICKHOUSE_COMPRESSOR_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/Compressor.cpp)
set(CLICKHOUSE_COMPRESSOR_LINK PRIVATE clickhouse_compression clickhouse_common_io ${Boost_PROGRAM_OPTIONS_LIBRARY})
#set(CLICKHOUSE_COMPRESSOR_INCLUDE SYSTEM PRIVATE ...)
clickhouse_program_add(compressor)

View File

@ -6,7 +6,7 @@
#cmakedefine01 ENABLE_CLICKHOUSE_CLIENT
#cmakedefine01 ENABLE_CLICKHOUSE_LOCAL
#cmakedefine01 ENABLE_CLICKHOUSE_BENCHMARK
#cmakedefine01 ENABLE_CLICKHOUSE_PERFORMANCE
#cmakedefine01 ENABLE_CLICKHOUSE_PERFORMANCE_TEST
#cmakedefine01 ENABLE_CLICKHOUSE_COPIER
#cmakedefine01 ENABLE_CLICKHOUSE_EXTRACT_FROM_CONFIG
#cmakedefine01 ENABLE_CLICKHOUSE_COMPRESSOR

View File

@ -1,8 +1,5 @@
add_library (clickhouse-copier-lib ${LINK_MODE} ClusterCopier.cpp)
target_link_libraries (clickhouse-copier-lib PRIVATE clickhouse-server-lib clickhouse_functions clickhouse_aggregate_functions daemon)
set(CLICKHOUSE_COPIER_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/ClusterCopier.cpp)
set(CLICKHOUSE_COPIER_LINK PRIVATE clickhouse_functions clickhouse_aggregate_functions daemon)
#set(CLICKHOUSE_COPIER_INCLUDE SYSTEM PRIVATE ...)
if (CLICKHOUSE_SPLIT_BINARY)
add_executable (clickhouse-copier clickhouse-copier.cpp)
target_link_libraries (clickhouse-copier clickhouse-copier-lib)
install (TARGETS clickhouse-copier ${CLICKHOUSE_ALL_TARGETS} RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse)
endif ()
clickhouse_program_add(copier)

View File

@ -1,8 +1,5 @@
add_library (clickhouse-extract-from-config-lib ${LINK_MODE} ExtractFromConfig.cpp)
target_link_libraries (clickhouse-extract-from-config-lib PRIVATE clickhouse_common_config clickhouse_common_io ${Boost_PROGRAM_OPTIONS_LIBRARY})
set(CLICKHOUSE_EXTRACT_FROM_CONFIG_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/ExtractFromConfig.cpp)
set(CLICKHOUSE_EXTRACT_FROM_CONFIG_LINK PRIVATE clickhouse_common_config clickhouse_common_io ${Boost_PROGRAM_OPTIONS_LIBRARY})
#set(CLICKHOUSE_EXTRACT_FROM_CONFIG_INCLUDE SYSTEM PRIVATE ...)
if (CLICKHOUSE_SPLIT_BINARY)
add_executable (clickhouse-extract-from-config clickhouse-extract-from-config.cpp)
target_link_libraries (clickhouse-extract-from-config PRIVATE clickhouse-extract-from-config-lib)
install (TARGETS clickhouse-extract-from-config ${CLICKHOUSE_ALL_TARGETS} RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse)
endif ()
clickhouse_program_add(extract-from-config)

View File

@ -1,7 +1,5 @@
add_library (clickhouse-format-lib ${LINK_MODE} Format.cpp)
target_link_libraries (clickhouse-format-lib PRIVATE dbms clickhouse_common_io clickhouse_parsers ${Boost_PROGRAM_OPTIONS_LIBRARY})
if (CLICKHOUSE_SPLIT_BINARY)
add_executable (clickhouse-format clickhouse-format.cpp)
target_link_libraries (clickhouse-format PRIVATE clickhouse-format-lib)
install (TARGETS clickhouse-format ${CLICKHOUSE_ALL_TARGETS} RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse)
endif ()
set(CLICKHOUSE_FORMAT_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/Format.cpp)
set(CLICKHOUSE_FORMAT_LINK PRIVATE dbms clickhouse_common_io clickhouse_parsers ${Boost_PROGRAM_OPTIONS_LIBRARY})
#set(CLICKHOUSE_FORMAT_INCLUDE SYSTEM PRIVATE ...)
clickhouse_program_add(format)

View File

@ -1,8 +1,9 @@
add_library (clickhouse-local-lib ${LINK_MODE} LocalServer.cpp)
target_link_libraries (clickhouse-local-lib PRIVATE clickhouse_dictionaries clickhouse_common_io clickhouse-server-lib clickhouse_functions clickhouse_aggregate_functions clickhouse_table_functions ${Boost_PROGRAM_OPTIONS_LIBRARY})
set(CLICKHOUSE_LOCAL_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/LocalServer.cpp)
set(CLICKHOUSE_LOCAL_LINK PRIVATE clickhouse_dictionaries clickhouse_common_io clickhouse_functions clickhouse_aggregate_functions clickhouse_table_functions ${Boost_PROGRAM_OPTIONS_LIBRARY})
#set(CLICKHOUSE_LOCAL_INCLUDE SYSTEM PRIVATE ...)
if (CLICKHOUSE_SPLIT_BINARY)
add_executable (clickhouse-local clickhouse-local.cpp)
target_link_libraries (clickhouse-local PRIVATE clickhouse-local-lib)
install (TARGETS clickhouse-local ${CLICKHOUSE_ALL_TARGETS} RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse)
clickhouse_program_add(local)
if(NOT CLICKHOUSE_ONE_SHARED)
target_link_libraries(clickhouse-local-lib PRIVATE clickhouse-server-lib)
endif ()

View File

@ -38,7 +38,7 @@ int mainEntryClickHouseLocal(int argc, char ** argv);
#if ENABLE_CLICKHOUSE_BENCHMARK || !defined(ENABLE_CLICKHOUSE_BENCHMARK)
int mainEntryClickHouseBenchmark(int argc, char ** argv);
#endif
#if ENABLE_CLICKHOUSE_PERFORMANCE || !defined(ENABLE_CLICKHOUSE_PERFORMANCE)
#if ENABLE_CLICKHOUSE_PERFORMANCE_TEST || !defined(ENABLE_CLICKHOUSE_PERFORMANCE_TEST)
int mainEntryClickHousePerformanceTest(int argc, char ** argv);
#endif
#if ENABLE_CLICKHOUSE_EXTRACT_FROM_CONFIG || !defined(ENABLE_CLICKHOUSE_EXTRACT_FROM_CONFIG)
@ -84,7 +84,7 @@ std::pair<const char *, MainFunc> clickhouse_applications[] =
#if ENABLE_CLICKHOUSE_SERVER || !defined(ENABLE_CLICKHOUSE_SERVER)
{"server", mainEntryClickHouseServer},
#endif
#if ENABLE_CLICKHOUSE_PERFORMANCE || !defined(ENABLE_CLICKHOUSE_PERFORMANCE)
#if ENABLE_CLICKHOUSE_PERFORMANCE_TEST || !defined(ENABLE_CLICKHOUSE_PERFORMANCE_TEST)
{"performance-test", mainEntryClickHousePerformanceTest},
#endif
#if ENABLE_CLICKHOUSE_EXTRACT_FROM_CONFIG || !defined(ENABLE_CLICKHOUSE_EXTRACT_FROM_CONFIG)

View File

@ -1,9 +1,5 @@
add_library (clickhouse-obfuscator-lib ${LINK_MODE} Obfuscator.cpp)
target_link_libraries (clickhouse-obfuscator-lib PRIVATE dbms ${Boost_PROGRAM_OPTIONS_LIBRARY})
set(CLICKHOUSE_OBFUSCATOR_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/Obfuscator.cpp)
set(CLICKHOUSE_OBFUSCATOR_LINK PRIVATE dbms ${Boost_PROGRAM_OPTIONS_LIBRARY})
#set(CLICKHOUSE_OBFUSCATOR_INCLUDE SYSTEM PRIVATE ...)
if (CLICKHOUSE_SPLIT_BINARY)
add_executable (clickhouse-obfuscator clickhouse-obfuscator.cpp)
set_target_properties(clickhouse-obfuscator PROPERTIES RUNTIME_OUTPUT_DIRECTORY ..)
target_link_libraries (clickhouse-obfuscator PRIVATE clickhouse-obfuscator-lib)
install (TARGETS clickhouse-obfuscator ${CLICKHOUSE_ALL_TARGETS} RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse)
endif ()
clickhouse_program_add(obfuscator)

View File

@ -1,30 +1,36 @@
add_headers_and_sources(clickhouse_odbc_bridge .)
set(CLICKHOUSE_ODBC_BRIDGE_SOURCES
${CMAKE_CURRENT_SOURCE_DIR}/ColumnInfoHandler.cpp
${CMAKE_CURRENT_SOURCE_DIR}/getIdentifierQuote.cpp
${CMAKE_CURRENT_SOURCE_DIR}/HandlerFactory.cpp
${CMAKE_CURRENT_SOURCE_DIR}/IdentifierQuoteHandler.cpp
${CMAKE_CURRENT_SOURCE_DIR}/MainHandler.cpp
${CMAKE_CURRENT_SOURCE_DIR}/ODBCBlockInputStream.cpp
${CMAKE_CURRENT_SOURCE_DIR}/odbc-bridge.cpp
${CMAKE_CURRENT_SOURCE_DIR}/ODBCBridge.cpp
${CMAKE_CURRENT_SOURCE_DIR}/PingHandler.cpp
${CMAKE_CURRENT_SOURCE_DIR}/validateODBCConnectionString.cpp
)
add_library (clickhouse-odbc-bridge-lib ${LINK_MODE} ${clickhouse_odbc_bridge_sources})
target_link_libraries (clickhouse-odbc-bridge-lib PRIVATE daemon dbms clickhouse_common_io)
target_include_directories (clickhouse-odbc-bridge-lib PUBLIC ${ClickHouse_SOURCE_DIR}/libs/libdaemon/include)
set(CLICKHOUSE_ODBC_BRIDGE_LINK PRIVATE daemon dbms clickhouse_common_io)
set(CLICKHOUSE_ODBC_BRIDGE_INCLUDE PUBLIC ${ClickHouse_SOURCE_DIR}/libs/libdaemon/include)
if (USE_POCO_SQLODBC)
target_link_libraries (clickhouse-odbc-bridge-lib PRIVATE ${Poco_SQLODBC_LIBRARY})
target_include_directories (clickhouse-odbc-bridge-lib SYSTEM PRIVATE ${ODBC_INCLUDE_DIRECTORIES} ${Poco_SQLODBC_INCLUDE_DIR})
set(CLICKHOUSE_ODBC_BRIDGE_LINK ${CLICKHOUSE_ODBC_BRIDGE_LINK} PRIVATE ${Poco_SQLODBC_LIBRARY})
set(CLICKHOUSE_ODBC_BRIDGE_INCLUDE ${CLICKHOUSE_ODBC_BRIDGE_INCLUDE} SYSTEM PRIVATE ${ODBC_INCLUDE_DIRECTORIES} ${Poco_SQLODBC_INCLUDE_DIR})
endif ()
if (Poco_SQL_FOUND)
target_link_libraries (clickhouse-odbc-bridge-lib PRIVATE ${Poco_SQL_LIBRARY})
set(CLICKHOUSE_ODBC_BRIDGE_LINK ${CLICKHOUSE_ODBC_BRIDGE_LINK} PRIVATE ${Poco_SQL_LIBRARY})
endif ()
if (USE_POCO_DATAODBC)
target_link_libraries (clickhouse-odbc-bridge-lib PRIVATE ${Poco_DataODBC_LIBRARY})
target_include_directories (clickhouse-odbc-bridge-lib SYSTEM PRIVATE ${ODBC_INCLUDE_DIRECTORIES} ${Poco_DataODBC_INCLUDE_DIR})
set(CLICKHOUSE_ODBC_BRIDGE_LINK ${CLICKHOUSE_ODBC_BRIDGE_LINK} PRIVATE ${Poco_DataODBC_LIBRARY})
set(CLICKHOUSE_ODBC_BRIDGE_INCLUDE ${CLICKHOUSE_ODBC_BRIDGE_INCLUDE} SYSTEM PRIVATE ${ODBC_INCLUDE_DIRECTORIES} ${Poco_DataODBC_INCLUDE_DIR})
endif()
if (Poco_Data_FOUND)
target_link_libraries (clickhouse-odbc-bridge-lib PRIVATE ${Poco_Data_LIBRARY})
set(CLICKHOUSE_ODBC_BRIDGE_LINK ${CLICKHOUSE_ODBC_BRIDGE_LINK} PRIVATE ${Poco_Data_LIBRARY})
endif ()
if (ENABLE_TESTS)
add_subdirectory (tests)
endif ()
clickhouse_program_add_library(odbc-bridge)
# clickhouse-odbc-bridge is always a separate binary.
# Reason: it must not export symbols from SSL, mariadb-client, etc., so as not to break ABI compatibility with ODBC drivers.
@ -32,5 +38,11 @@ endif ()
SET(CMAKE_SHARED_LIBRARY_LINK_CXX_FLAGS "")
add_executable (clickhouse-odbc-bridge odbc-bridge.cpp)
target_link_libraries (clickhouse-odbc-bridge PRIVATE clickhouse-odbc-bridge-lib)
clickhouse_program_link_split_binary(odbc-bridge)
install (TARGETS clickhouse-odbc-bridge RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse)
if (ENABLE_TESTS)
add_subdirectory (tests)
endif ()

View File

@ -1,2 +1,3 @@
add_executable (validate-odbc-connection-string validate-odbc-connection-string.cpp)
target_link_libraries (validate-odbc-connection-string PRIVATE clickhouse-odbc-bridge-lib clickhouse_common_io)
clickhouse_target_link_split_lib(validate-odbc-connection-string odbc-bridge)
target_link_libraries (validate-odbc-connection-string PRIVATE clickhouse_common_io)

View File

@ -1,21 +1,18 @@
add_library (clickhouse-performance-test-lib ${LINK_MODE}
JSONString.cpp
StopConditionsSet.cpp
TestStopConditions.cpp
TestStats.cpp
ConfigPreprocessor.cpp
PerformanceTest.cpp
PerformanceTestInfo.cpp
executeQuery.cpp
applySubstitutions.cpp
ReportBuilder.cpp
PerformanceTestSuite.cpp
)
target_link_libraries (clickhouse-performance-test-lib PRIVATE dbms clickhouse_common_io clickhouse_common_config ${Boost_PROGRAM_OPTIONS_LIBRARY})
target_include_directories (clickhouse-performance-test-lib SYSTEM PRIVATE ${PCG_RANDOM_INCLUDE_DIR})
set(CLICKHOUSE_PERFORMANCE_TEST_SOURCES
${CMAKE_CURRENT_SOURCE_DIR}/JSONString.cpp
${CMAKE_CURRENT_SOURCE_DIR}/StopConditionsSet.cpp
${CMAKE_CURRENT_SOURCE_DIR}/TestStopConditions.cpp
${CMAKE_CURRENT_SOURCE_DIR}/TestStats.cpp
${CMAKE_CURRENT_SOURCE_DIR}/ConfigPreprocessor.cpp
${CMAKE_CURRENT_SOURCE_DIR}/PerformanceTest.cpp
${CMAKE_CURRENT_SOURCE_DIR}/PerformanceTestInfo.cpp
${CMAKE_CURRENT_SOURCE_DIR}/executeQuery.cpp
${CMAKE_CURRENT_SOURCE_DIR}/applySubstitutions.cpp
${CMAKE_CURRENT_SOURCE_DIR}/ReportBuilder.cpp
${CMAKE_CURRENT_SOURCE_DIR}/PerformanceTestSuite.cpp
)
if (CLICKHOUSE_SPLIT_BINARY)
add_executable (clickhouse-performance-test clickhouse-performance-test.cpp)
target_link_libraries (clickhouse-performance-test PRIVATE clickhouse-performance-test-lib)
install (TARGETS clickhouse-performance-test ${CLICKHOUSE_ALL_TARGETS} RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse)
endif ()
set(CLICKHOUSE_PERFORMANCE_TEST_LINK PRIVATE dbms clickhouse_common_io clickhouse_common_config ${Boost_PROGRAM_OPTIONS_LIBRARY})
set(CLICKHOUSE_PERFORMANCE_TEST_INCLUDE SYSTEM PRIVATE ${PCG_RANDOM_INCLUDE_DIR})
clickhouse_program_add(performance-test)

View File

@ -1,27 +1,22 @@
add_library (clickhouse-server-lib ${LINK_MODE}
HTTPHandler.cpp
InterserverIOHTTPHandler.cpp
MetricsTransmitter.cpp
NotFoundHandler.cpp
PingRequestHandler.cpp
ReplicasStatusHandler.cpp
RootRequestHandler.cpp
Server.cpp
TCPHandler.cpp
)
set(CLICKHOUSE_SERVER_SOURCES
${CMAKE_CURRENT_SOURCE_DIR}/HTTPHandler.cpp
${CMAKE_CURRENT_SOURCE_DIR}/InterserverIOHTTPHandler.cpp
${CMAKE_CURRENT_SOURCE_DIR}/MetricsTransmitter.cpp
${CMAKE_CURRENT_SOURCE_DIR}/NotFoundHandler.cpp
${CMAKE_CURRENT_SOURCE_DIR}/PingRequestHandler.cpp
${CMAKE_CURRENT_SOURCE_DIR}/ReplicasStatusHandler.cpp
${CMAKE_CURRENT_SOURCE_DIR}/RootRequestHandler.cpp
${CMAKE_CURRENT_SOURCE_DIR}/Server.cpp
${CMAKE_CURRENT_SOURCE_DIR}/TCPHandler.cpp
)
target_link_libraries (clickhouse-server-lib PRIVATE clickhouse_dictionaries clickhouse_common_io daemon clickhouse_storages_system clickhouse_functions clickhouse_aggregate_functions clickhouse_table_functions ${Poco_Net_LIBRARY})
set(CLICKHOUSE_SERVER_LINK PRIVATE clickhouse_dictionaries clickhouse_common_io daemon clickhouse_storages_system clickhouse_functions clickhouse_aggregate_functions clickhouse_table_functions ${Poco_Net_LIBRARY})
if (USE_POCO_NETSSL)
target_link_libraries (clickhouse-server-lib PRIVATE ${Poco_NetSSL_LIBRARY} ${Poco_Crypto_LIBRARY})
set(CLICKHOUSE_SERVER_LINK ${CLICKHOUSE_SERVER_LINK} PRIVATE ${Poco_NetSSL_LIBRARY} ${Poco_Crypto_LIBRARY})
endif ()
set(CLICKHOUSE_SERVER_INCLUDE PUBLIC ${ClickHouse_SOURCE_DIR}/libs/libdaemon/include)
target_include_directories (clickhouse-server-lib PUBLIC ${ClickHouse_SOURCE_DIR}/libs/libdaemon/include)
if (CLICKHOUSE_SPLIT_BINARY)
add_executable (clickhouse-server clickhouse-server.cpp)
target_link_libraries (clickhouse-server PRIVATE clickhouse-server-lib)
install (TARGETS clickhouse-server ${CLICKHOUSE_ALL_TARGETS} RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse)
endif ()
clickhouse_program_add(server)
if (GLIBC_COMPATIBILITY)
set (GLIBC_MAX_REQUIRED 2.4 CACHE INTERNAL "")
@ -31,7 +26,4 @@ if (GLIBC_COMPATIBILITY)
#add_test(NAME GLIBC_required_version COMMAND bash -c "readelf -s ${CMAKE_CURRENT_BINARY_DIR}/../clickhouse-server | grep '@GLIBC' | grep -oP 'GLIBC_[\\d\\.]+' | sort | uniq | sort --version-sort --reverse | perl -lnE 'warn($_), exit 1 if $_ gt q{GLIBC_${GLIBC_MAX_REQUIRED}}'") # old
endif ()
install (
FILES config.xml users.xml
DESTINATION ${CLICKHOUSE_ETC_DIR}/clickhouse-server
COMPONENT clickhouse)
install(FILES config.xml users.xml DESTINATION ${CLICKHOUSE_ETC_DIR}/clickhouse-server COMPONENT clickhouse)

View File

@ -4,7 +4,6 @@
<default>
<networks replace="replace">
<ip>::1</ip>
<ip>0.0.0.0</ip>
<ip>127.0.0.1</ip>
</networks>
</default>

View File

@ -0,0 +1,40 @@
#include <AggregateFunctions/AggregateFunctionFactory.h>
#include <AggregateFunctions/AggregateFunctionGroupBitmap.h>
#include <AggregateFunctions/Helpers.h>
#include <AggregateFunctions/FactoryHelpers.h>
namespace DB
{
namespace
{
template <template <typename> class Data>
AggregateFunctionPtr createAggregateFunctionBitmap(const std::string & name, const DataTypes & argument_types, const Array & parameters)
{
assertNoParameters(name, parameters);
assertUnary(name, argument_types);
if (!argument_types[0]->canBeUsedInBitOperations())
throw Exception("The type " + argument_types[0]->getName() + " of argument for aggregate function " + name
+ " is illegal, because it cannot be used in Bitmap operations",
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
AggregateFunctionPtr res(createWithUnsignedIntegerType<AggregateFunctionBitmap, Data>(*argument_types[0], argument_types[0]));
if (!res)
throw Exception("Illegal type " + argument_types[0]->getName() + " of argument for aggregate function " + name, ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
return res;
}
}
void registerAggregateFunctionsBitmap(AggregateFunctionFactory & factory)
{
factory.registerFunction("groupBitmap", createAggregateFunctionBitmap<AggregateFunctionGroupBitmapData>);
}
}
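
For context, helpers like createWithUnsignedIntegerType map the runtime type of the argument column to a concrete template instantiation. A minimal standalone sketch of that dispatch pattern follows; TypeTag, BitmapFunction and createForUnsignedInteger are hypothetical names, not ClickHouse's real factory types:

#include <cstdint>
#include <memory>

// Hypothetical stand-ins; ClickHouse uses IAggregateFunction and DataTypePtr here.
enum class TypeTag { UInt8, UInt16, UInt32, UInt64, Other };

struct IFunction { virtual ~IFunction() = default; };

template <typename T>
struct BitmapFunction : IFunction {};  // would wrap AggregateFunctionBitmap<T, Data<T>>

// Sketch of a createWithUnsignedIntegerType-style helper: pick the template
// instantiation matching the runtime type tag, or return nullptr so the caller
// can raise ILLEGAL_TYPE_OF_ARGUMENT.
inline std::unique_ptr<IFunction> createForUnsignedInteger(TypeTag tag)
{
    switch (tag)
    {
        case TypeTag::UInt8:  return std::make_unique<BitmapFunction<uint8_t>>();
        case TypeTag::UInt16: return std::make_unique<BitmapFunction<uint16_t>>();
        case TypeTag::UInt32: return std::make_unique<BitmapFunction<uint32_t>>();
        case TypeTag::UInt64: return std::make_unique<BitmapFunction<uint64_t>>();
        default: return nullptr;
    }
}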

View File

@ -0,0 +1,56 @@
#pragma once
#include <Columns/ColumnVector.h>
#include <boost/noncopyable.hpp>
#include <AggregateFunctions/IAggregateFunction.h>
#include <AggregateFunctions/AggregateFunctionGroupBitmapData.h>
#include <DataTypes/DataTypesNumber.h>
namespace DB
{
/// Aggregates numbers into a bitmap and returns its cardinality.
template <typename T, typename Data>
class AggregateFunctionBitmap final : public IAggregateFunctionDataHelper<Data, AggregateFunctionBitmap<T, Data>>
{
public:
AggregateFunctionBitmap(const DataTypePtr & type)
: IAggregateFunctionDataHelper<Data, AggregateFunctionBitmap<T, Data>>({type}, {}) {}
String getName() const override { return Data::name(); }
DataTypePtr getReturnType() const override
{
return std::make_shared<DataTypeNumber<T>>();
}
void add(AggregateDataPtr place, const IColumn ** columns, size_t row_num, Arena *) const override
{
this->data(place).rbs.add(static_cast<const ColumnVector<T> &>(*columns[0]).getData()[row_num]);
}
void merge(AggregateDataPtr place, ConstAggregateDataPtr rhs, Arena *) const override
{
this->data(place).rbs.merge(this->data(rhs).rbs);
}
void serialize(ConstAggregateDataPtr place, WriteBuffer & buf) const override
{
this->data(place).rbs.write(buf);
}
void deserialize(AggregateDataPtr place, ReadBuffer & buf, Arena *) const override
{
this->data(place).rbs.read(buf);
}
void insertResultInto(ConstAggregateDataPtr place, IColumn & to) const override
{
static_cast<ColumnVector<T> &>(to).getData().push_back(this->data(place).rbs.size());
}
const char * getHeaderFilePath() const override { return __FILE__; }
};
}
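
The overrides above implement the usual aggregate-function lifecycle: add() folds one row into a state, merge() combines two partial states (for example, from different threads), and insertResultInto() emits the final value. A toy analogue with a std::set standing in for the bitmap, purely to illustrate the flow (ToyBitmapState is hypothetical):

#include <cstdint>
#include <iostream>
#include <set>

// Toy stand-in for AggregateFunctionGroupBitmapData<T>: a set instead of a bitmap.
struct ToyBitmapState
{
    std::set<uint32_t> values;
    void add(uint32_t v) { values.insert(v); }      // like add(): fold in one row
    void merge(const ToyBitmapState & rhs)          // like merge(): combine states
    {
        values.insert(rhs.values.begin(), rhs.values.end());
    }
    uint64_t size() const { return values.size(); } // like insertResultInto(): cardinality
};

int main()
{
    // Two partial aggregation states, e.g. from two threads or shards.
    ToyBitmapState a, b;
    for (uint32_t v : {1u, 2u, 3u}) a.add(v);
    for (uint32_t v : {3u, 4u}) b.add(v);
    a.merge(b);
    std::cout << a.size() << "\n";  // prints 4: a groupBitmap-style distinct count
    return 0;
}

Replacing the std::set with RoaringBitmapWithSmallSet gives exactly the groupBitmap behaviour: the result is the cardinality of the merged bitmap.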

View File

@ -0,0 +1,516 @@
#pragma once
#include <roaring.h>
#include <IO/ReadHelpers.h>
#include <IO/WriteHelpers.h>
#include <boost/noncopyable.hpp>
#include <roaring.hh>
#include <Common/HashTable/SmallTable.h>
namespace DB
{
/**
* For a small number of values, an array of fixed size is used "on the stack".
* For a larger number, a roaring_bitmap_t is allocated.
* For a description of roaring_bitmap_t, see: https://github.com/RoaringBitmap/CRoaring
*/
template <typename T, UInt8 small_set_size>
class RoaringBitmapWithSmallSet : private boost::noncopyable
{
private:
using Small = SmallSet<T, small_set_size>;
using ValueBuffer = std::vector<T>;
Small small;
roaring_bitmap_t * rb = nullptr;
void toLarge()
{
rb = roaring_bitmap_create();
for (const auto & x : small)
roaring_bitmap_add(rb, x.getValue());
}
public:
bool isLarge() const { return rb != nullptr; }
bool isSmall() const { return rb == nullptr; }
~RoaringBitmapWithSmallSet()
{
if (isLarge())
roaring_bitmap_free(rb);
}
void add(T value)
{
if (isSmall())
{
if (small.find(value) == small.end())
{
if (!small.full())
small.insert(value);
else
{
toLarge();
roaring_bitmap_add(rb, value);
}
}
}
else
roaring_bitmap_add(rb, value);
}
UInt64 size() const { return isSmall() ? small.size() : roaring_bitmap_get_cardinality(rb); }
void merge(const RoaringBitmapWithSmallSet & r1)
{
if (r1.isLarge())
{
if (isSmall())
toLarge();
roaring_bitmap_or_inplace(rb, r1.rb);
}
else
{
for (const auto & x : r1.small)
add(x.getValue());
}
}
void read(DB::ReadBuffer & in)
{
bool is_large;
readBinary(is_large, in);
if (is_large)
{
toLarge();
UInt32 cardinality;
readBinary(cardinality, in);
db_roaring_bitmap_add_many(in, rb, cardinality);
}
else
small.read(in);
}
void write(DB::WriteBuffer & out) const
{
writeBinary(isLarge(), out);
if (isLarge())
{
UInt32 cardinality = roaring_bitmap_get_cardinality(rb);
writePODBinary(cardinality, out);
db_ra_to_uint32_array(out, &rb->high_low_container);
}
else
small.write(out);
}
roaring_bitmap_t * getRb() const { return rb; }
const Small & getSmall() const { return small; }
/**
* Get a new roaring_bitmap_t from elements of small
*/
roaring_bitmap_t * getNewRbFromSmall() const
{
roaring_bitmap_t * smallRb = roaring_bitmap_create();
for (const auto & x : small)
roaring_bitmap_add(smallRb, x.getValue());
return smallRb;
}
/**
* Computes the intersection between two bitmaps
*/
void rb_and(const RoaringBitmapWithSmallSet & r1)
{
ValueBuffer buffer;
if (isSmall() && r1.isSmall())
{
// intersect
for (const auto & x : small)
if (r1.small.find(x.getValue()) != r1.small.end())
buffer.push_back(x.getValue());
// Clear out the original values
small.clear();
for (const auto & value : buffer)
small.insert(value);
buffer.clear();
}
else if (isSmall() && r1.isLarge())
{
for (const auto & x : small)
if (roaring_bitmap_contains(r1.rb, x.getValue()))
buffer.push_back(x.getValue());
// Clear out the original values
small.clear();
for (const auto & value : buffer)
small.insert(value);
buffer.clear();
}
else
{
roaring_bitmap_t * rb1 = r1.isSmall() ? r1.getNewRbFromSmall() : r1.getRb();
roaring_bitmap_and_inplace(rb, rb1);
if (r1.isSmall())
roaring_bitmap_free(rb1);
}
}
/**
* Computes the union between two bitmaps.
*/
void rb_or(const RoaringBitmapWithSmallSet & r1) { merge(r1); }
/**
* Computes the symmetric difference (xor) between two bitmaps.
*/
void rb_xor(const RoaringBitmapWithSmallSet & r1)
{
if (isSmall())
toLarge();
roaring_bitmap_t * rb1 = r1.isSmall() ? r1.getNewRbFromSmall() : r1.getRb();
roaring_bitmap_xor_inplace(rb, rb1);
if (r1.isSmall())
roaring_bitmap_free(rb1);
}
/**
* Computes the difference (andnot) between two bitmaps
*/
void rb_andnot(const RoaringBitmapWithSmallSet & r1)
{
ValueBuffer buffer;
if (isSmall() && r1.isSmall())
{
// subtract
for (const auto & x : small)
if (r1.small.find(x.getValue()) == r1.small.end())
buffer.push_back(x.getValue());
// Clear out the original values
small.clear();
for (const auto & value : buffer)
small.insert(value);
buffer.clear();
}
else if (isSmall() && r1.isLarge())
{
for (const auto & x : small)
if (!roaring_bitmap_contains(r1.rb, x.getValue()))
buffer.push_back(x.getValue());
// Clear out the original values
small.clear();
for (const auto & value : buffer)
small.insert(value);
buffer.clear();
}
else
{
roaring_bitmap_t * rb1 = r1.isSmall() ? r1.getNewRbFromSmall() : r1.getRb();
roaring_bitmap_andnot_inplace(rb, rb1);
if (r1.isSmall())
roaring_bitmap_free(rb1);
}
}
/**
* Computes the cardinality of the intersection between two bitmaps.
*/
UInt64 rb_and_cardinality(const RoaringBitmapWithSmallSet & r1) const
{
UInt64 retSize = 0;
if (isSmall() && r1.isSmall())
{
for (const auto & x : small)
if (r1.small.find(x.getValue()) != r1.small.end())
retSize++;
}
else if (isSmall() && r1.isLarge())
{
for (const auto & x : small)
if (roaring_bitmap_contains(r1.rb, x.getValue()))
retSize++;
}
else
{
roaring_bitmap_t * rb1 = r1.isSmall() ? r1.getNewRbFromSmall() : r1.getRb();
retSize = roaring_bitmap_and_cardinality(rb, rb1);
if (r1.isSmall())
roaring_bitmap_free(rb1);
}
return retSize;
}
/**
* Computes the cardinality of the union between two bitmaps.
*/
UInt64 rb_or_cardinality(const RoaringBitmapWithSmallSet & r1) const
{
UInt64 c1 = size();
UInt64 c2 = r1.size();
UInt64 inter = rb_and_cardinality(r1);
return c1 + c2 - inter;
}
/**
* Computes the cardinality of the symmetric difference (xor) between two bitmaps.
*/
UInt64 rb_xor_cardinality(const RoaringBitmapWithSmallSet & r1) const
{
UInt64 c1 = size();
UInt64 c2 = r1.size();
UInt64 inter = rb_and_cardinality(r1);
return c1 + c2 - 2 * inter;
}
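/** Worked example of the identity above: for A = {1, 2, 3} and B = {2, 3, 4},
* |A xor B| = |A| + |B| - 2 * |A and B| = 3 + 3 - 2 * 2 = 2, i.e. {1, 4}.
*/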
/**
* Computes the cardinality of the difference (andnot) between two bitmaps.
*/
UInt64 rb_andnot_cardinality(const RoaringBitmapWithSmallSet & r1) const
{
UInt64 c1 = size();
UInt64 inter = rb_and_cardinality(r1);
return c1 - inter;
}
/**
* Return 1 if the two bitmaps contain the same elements.
*/
UInt8 rb_equals(const RoaringBitmapWithSmallSet & r1)
{
if (isSmall())
toLarge();
roaring_bitmap_t * rb1 = r1.isSmall() ? r1.getNewRbFromSmall() : r1.getRb();
UInt8 is_true = roaring_bitmap_equals(rb, rb1);
if (r1.isSmall())
roaring_bitmap_free(rb1);
return is_true;
}
/**
* Check whether two bitmaps intersect.
*/
UInt8 rb_intersect(const RoaringBitmapWithSmallSet & r1)
{
if (isSmall())
toLarge();
roaring_bitmap_t * rb1 = r1.isSmall() ? r1.getNewRbFromSmall() : r1.getRb();
UInt8 is_true = roaring_bitmap_intersect(rb, rb1);
if (r1.isSmall())
roaring_bitmap_free(rb1);
return is_true;
}
/**
* Remove value
*/
void rb_remove(UInt64 offsetid)
{
if (isSmall())
toLarge();
roaring_bitmap_remove(rb, offsetid);
}
/**
* compute (in place) the negation of the roaring bitmap within a specified
* interval: [range_start, range_end). The number of negated values is
* range_end - range_start.
* Areas outside the range are passed through unchanged.
*/
void rb_flip(UInt64 offsetstart, UInt64 offsetend)
{
if (isSmall())
toLarge();
roaring_bitmap_flip_inplace(rb, offsetstart, offsetend);
}
/**
* Returns the number of integers that are smaller than or equal to offsetid.
*/
UInt64 rb_rank(UInt64 offsetid)
{
if (isSmall())
toLarge();
return roaring_bitmap_rank(rb, offsetid);
}
/**
* Convert elements to integer array, return number of elements
*/
template <typename Element>
UInt64 rb_to_array(PaddedPODArray<Element> & res_data) const
{
UInt64 count = 0;
if (isSmall())
{
for (const auto & x : small)
{
res_data.emplace_back(x.getValue());
count++;
}
}
else
{
roaring_uint32_iterator_t iterator;
roaring_init_iterator(rb, &iterator);
while (iterator.has_value)
{
res_data.emplace_back(iterator.current_value);
roaring_advance_uint32_iterator(&iterator);
count++;
}
}
return count;
}
private:
/// Code migrated from CRoaring to read and write the DB buffer directly.
void db_roaring_bitmap_add_many(DB::ReadBuffer & dbBuf, roaring_bitmap_t * r, size_t n_args)
{
void * container = NULL; // hold value of last container touched
uint8_t typecode = 0; // typecode of last container touched
uint32_t prev = 0; // previous value inserted
size_t i = 0; // index of value
int containerindex = 0;
if (n_args == 0)
return;
uint32_t val;
readBinary(val, dbBuf);
container = containerptr_roaring_bitmap_add(r, val, &typecode, &containerindex);
prev = val;
i++;
for (; i < n_args; i++)
{
readBinary(val, dbBuf);
if (((prev ^ val) >> 16) == 0)
{ // no need to seek the container, it is at hand
// because we already have the container at hand, we can do the
// insertion
// automatically, bypassing the roaring_bitmap_add call
uint8_t newtypecode = typecode;
void * container2 = container_add(container, val & 0xFFFF, typecode, &newtypecode);
// rare instance when we need to
if (container2 != container)
{
// change the container type
container_free(container, typecode);
ra_set_container_at_index(&r->high_low_container, containerindex, container2, newtypecode);
typecode = newtypecode;
container = container2;
}
}
else
{
container = containerptr_roaring_bitmap_add(r, val, &typecode, &containerindex);
}
prev = val;
}
}
void db_ra_to_uint32_array(DB::WriteBuffer & dbBuf, roaring_array_t * ra) const
{
size_t ctr = 0;
for (Int32 i = 0; i < ra->size; ++i)
{
Int32 num_added = db_container_to_uint32_array(dbBuf, ra->containers[i], ra->typecodes[i], ((UInt32)ra->keys[i]) << 16);
ctr += num_added;
}
}
UInt32 db_container_to_uint32_array(DB::WriteBuffer & dbBuf, const void * container, UInt8 typecode, UInt32 base) const
{
container = container_unwrap_shared(container, &typecode);
switch (typecode)
{
case BITSET_CONTAINER_TYPE_CODE:
return db_bitset_container_to_uint32_array(dbBuf, (const bitset_container_t *)container, base);
case ARRAY_CONTAINER_TYPE_CODE:
return db_array_container_to_uint32_array(dbBuf, (const array_container_t *)container, base);
case RUN_CONTAINER_TYPE_CODE:
return db_run_container_to_uint32_array(dbBuf, (const run_container_t *)container, base);
}
return 0;
}
UInt32 db_bitset_container_to_uint32_array(DB::WriteBuffer & dbBuf, const bitset_container_t * cont, UInt32 base) const
{
return (UInt32)db_bitset_extract_setbits(dbBuf, cont->array, BITSET_CONTAINER_SIZE_IN_WORDS, base);
}
size_t db_bitset_extract_setbits(DB::WriteBuffer & dbBuf, UInt64 * bitset, size_t length, UInt32 base) const
{
UInt32 outpos = 0;
for (size_t i = 0; i < length; ++i)
{
UInt64 w = bitset[i];
while (w != 0)
{
UInt64 t = w & (~w + 1); // on x64, should compile to BLSI (careful: the Intel compiler seems to fail)
UInt32 r = __builtin_ctzll(w); // on x64, should compile to TZCNT
UInt32 val = r + base;
writePODBinary(val, dbBuf);
outpos++;
w ^= t;
}
base += 64;
}
return outpos;
}
int db_array_container_to_uint32_array(DB::WriteBuffer & dbBuf, const array_container_t * cont, UInt32 base) const
{
UInt32 outpos = 0;
for (Int32 i = 0; i < cont->cardinality; ++i)
{
const UInt32 val = base + cont->array[i];
writePODBinary(val, dbBuf);
outpos++;
}
return outpos;
}
int db_run_container_to_uint32_array(DB::WriteBuffer & dbBuf, const run_container_t * cont, UInt32 base) const
{
UInt32 outpos = 0;
for (Int32 i = 0; i < cont->n_runs; ++i)
{
UInt32 run_start = base + cont->runs[i].value;
UInt16 le = cont->runs[i].length;
for (Int32 j = 0; j <= le; ++j)
{
UInt32 val = run_start + j;
writePODBinary(val, dbBuf);
outpos++;
}
}
return outpos;
}
};
template <typename T>
struct AggregateFunctionGroupBitmapData
{
RoaringBitmapWithSmallSet<T, 32> rbs;
static const char * name() { return "groupBitmap"; }
};
}
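
The small-set-then-promote pattern above does not depend on CRoaring itself. A minimal self-contained sketch of the same idea, with a fixed-size array standing in for SmallSet and std::set standing in for roaring_bitmap_t (all names here are illustrative, not ClickHouse API):

#include <algorithm>
#include <array>
#include <cstddef>
#include <memory>
#include <set>

// Stores up to N values inline; promotes to a heap-allocated set on overflow.
template <typename T, std::size_t N>
class SmallSetThenLarge
{
    std::array<T, N> small{};
    std::size_t small_size = 0;
    std::unique_ptr<std::set<T>> large;  // analogous to roaring_bitmap_t *

    void toLarge()
    {
        large = std::make_unique<std::set<T>>(small.begin(), small.begin() + small_size);
    }

public:
    bool isSmall() const { return !large; }

    void add(T value)
    {
        if (!isSmall()) { large->insert(value); return; }
        auto end = small.begin() + small_size;
        if (std::find(small.begin(), end, value) != end)
            return;                       // already present
        if (small_size < N)
            small[small_size++] = value;  // still fits inline
        else
        {
            toLarge();                    // promote, then insert into the large form
            large->insert(value);
        }
    }

    std::size_t size() const { return isSmall() ? small_size : large->size(); }
};

As in toLarge() above, promotion is one-way: once the inline capacity is exceeded, every later operation goes through the heap-allocated structure.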

View File

@ -20,7 +20,7 @@ list(REMOVE_ITEM clickhouse_aggregate_functions_headers
)
add_library(clickhouse_aggregate_functions ${LINK_MODE} ${clickhouse_aggregate_functions_sources})
target_link_libraries(clickhouse_aggregate_functions PRIVATE dbms)
target_link_libraries(clickhouse_aggregate_functions PRIVATE dbms PUBLIC ${CITYHASH_LIBRARIES})
target_include_directories (clickhouse_aggregate_functions BEFORE PRIVATE ${COMMON_INCLUDE_DIR})
if (ENABLE_TESTS)

View File

@ -26,6 +26,7 @@ void registerAggregateFunctionUniqCombined(AggregateFunctionFactory &);
void registerAggregateFunctionUniqUpTo(AggregateFunctionFactory &);
void registerAggregateFunctionTopK(AggregateFunctionFactory &);
void registerAggregateFunctionsBitwise(AggregateFunctionFactory &);
void registerAggregateFunctionsBitmap(AggregateFunctionFactory &);
void registerAggregateFunctionsMaxIntersections(AggregateFunctionFactory &);
void registerAggregateFunctionEntropy(AggregateFunctionFactory &);
@ -63,6 +64,7 @@ void registerAggregateFunctions()
registerAggregateFunctionUniqUpTo(factory);
registerAggregateFunctionTopK(factory);
registerAggregateFunctionsBitwise(factory);
registerAggregateFunctionsBitmap(factory);
registerAggregateFunctionsMaxIntersections(factory);
registerAggregateFunctionHistogram(factory);
registerAggregateFunctionRetention(factory);

View File

@ -4,6 +4,7 @@
#include <Common/Arena.h>
#include <Common/SipHash.h>
#include <Common/memcpySmall.h>
#include <Common/memcmpSmall.h>
#include <DataStreams/ColumnGathererStream.h>
@ -106,8 +107,7 @@ struct ColumnFixedString::less
explicit less(const ColumnFixedString & parent_) : parent(parent_) {}
bool operator()(size_t lhs, size_t rhs) const
{
/// TODO: memcmp slows down.
int res = memcmp(&parent.chars[lhs * parent.n], &parent.chars[rhs * parent.n], parent.n);
int res = memcmpSmallAllowOverflow15(parent.chars.data() + lhs * parent.n, parent.chars.data() + rhs * parent.n, parent.n);
return positive ? (res < 0) : (res > 0);
}
};

View File

@ -1,8 +1,7 @@
#pragma once
#include <string.h> // memcmp
#include <Common/PODArray.h>
#include <Common/memcmpSmall.h>
#include <Columns/IColumn.h>
#include <Columns/ColumnVectorHelper.h>
@ -98,7 +97,7 @@ public:
int compareAt(size_t p1, size_t p2, const IColumn & rhs_, int /*nan_direction_hint*/) const override
{
const ColumnFixedString & rhs = static_cast<const ColumnFixedString &>(rhs_);
return memcmp(&chars[p1 * n], &rhs.chars[p2 * n], n);
return memcmpSmallAllowOverflow15(chars.data() + p1 * n, rhs.chars.data() + p2 * n, n);
}
void getPermutation(bool reverse, size_t limit, int nan_direction_hint, Permutation & res) const override;

View File

@ -1,5 +1,6 @@
#include <Core/Defines.h>
#include <Common/Arena.h>
#include <Common/memcmpSmall.h>
#include <Columns/Collator.h>
#include <Columns/ColumnString.h>
#include <Columns/ColumnsCommon.h>
@ -239,15 +240,11 @@ struct ColumnString::less
explicit less(const ColumnString & parent_) : parent(parent_) {}
bool operator()(size_t lhs, size_t rhs) const
{
size_t left_len = parent.sizeAt(lhs);
size_t right_len = parent.sizeAt(rhs);
int res = memcmp(&parent.chars[parent.offsetAt(lhs)], &parent.chars[parent.offsetAt(rhs)], std::min(left_len, right_len));
if (res != 0)
return positive ? (res < 0) : (res > 0);
else
return positive ? (left_len < right_len) : (left_len > right_len);
int res = memcmpSmallAllowOverflow15(
parent.chars.data() + parent.offsetAt(lhs), parent.sizeAt(lhs) - 1,
parent.chars.data() + parent.offsetAt(rhs), parent.sizeAt(rhs) - 1);
return positive ? (res < 0) : (res > 0);
}
};
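
The sizeAt(...) - 1 arguments above drop the terminating zero byte: ColumnString stores each value zero-terminated in its chars buffer, and sizeAt() counts that terminator. A sketch of the assumed layout (hypothetical contents):

// chars:   'f' 'o' 'o' '\0' 'b' 'a' 'r' 'b' 'a' 'z' '\0'
// offsets:               4                           11
// sizeAt(0) == offsets[0] - offsets[-1] == 4 ("foo" plus the terminator),
// so the comparable payload is sizeAt(0) - 1 == 3 bytes.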

View File

@ -6,6 +6,7 @@
#include <Common/PODArray.h>
#include <Common/SipHash.h>
#include <Common/memcpySmall.h>
#include <Common/memcmpSmall.h>
class Collator;
@ -210,16 +211,7 @@ public:
int compareAt(size_t n, size_t m, const IColumn & rhs_, int /*nan_direction_hint*/) const override
{
const ColumnString & rhs = static_cast<const ColumnString &>(rhs_);
const size_t size = sizeAt(n);
const size_t rhs_size = rhs.sizeAt(m);
int cmp = memcmp(&chars[offsetAt(n)], &rhs.chars[rhs.offsetAt(m)], std::min(size, rhs_size));
if (cmp != 0)
return cmp;
else
return size > rhs_size ? 1 : (size < rhs_size ? -1 : 0);
return memcmpSmallAllowOverflow15(chars.data() + offsetAt(n), sizeAt(n) - 1, rhs.chars.data() + rhs.offsetAt(m), rhs.sizeAt(m) - 1);
}
/// Variant of compareAt for string comparison with respect of collation.

View File

@ -424,6 +424,7 @@ namespace ErrorCodes
extern const int POCO_EXCEPTION = 1000;
extern const int STD_EXCEPTION = 1001;
extern const int UNKNOWN_EXCEPTION = 1002;
extern const int METRIKA_OTHER_ERROR = 1003;
extern const int CONDITIONAL_TREE_PARENT_NOT_FOUND = 2001;
extern const int ILLEGAL_PROJECTION_MANIPULATOR = 2002;

View File

@ -17,6 +17,7 @@ namespace DB
namespace ErrorCodes
{
extern const int POCO_EXCEPTION;
extern const int METRIKA_OTHER_ERROR;
}
class Exception : public Poco::Exception

View File

@ -157,6 +157,7 @@ void ThreadPoolImpl<Thread>::worker(typename std::list<Thread>::iterator thread_
}
else
{
/// shutdown is true, simply finish the thread.
return;
}
}

View File

@ -0,0 +1,239 @@
#pragma once
#include <cstdint>
#include <algorithm>
namespace detail
{
template <typename T>
inline int cmp(T a, T b)
{
if (a < b)
return -1;
if (a > b)
return 1;
return 0;
}
}
#ifdef __SSE2__
#include <emmintrin.h>
/** All functions work under the following assumptions:
* - it's possible to read up to 15 excessive bytes after the end of the 'a' and 'b' regions;
* - the memory regions are relatively small, so extra loop unrolling is not worth doing.
*/
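/** All the SSE2 variants below use one idiom: load 16 bytes from each side with
* _mm_loadu_si128, compare bytewise with _mm_cmpeq_epi8, compress the result into a
* 16-bit mask with _mm_movemask_epi8, invert it so set bits mark mismatching bytes,
* and locate the first mismatch with __builtin_ctz. Loading a full 16-byte vector at
* the tail is what requires the "up to 15 excessive bytes" guarantee; within
* ClickHouse, PaddedPODArray-backed buffers provide that padding.
*/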
/** Variant when memory regions may have different sizes.
*/
template <typename Char>
inline int memcmpSmallAllowOverflow15(const Char * a, size_t a_size, const Char * b, size_t b_size)
{
size_t min_size = std::min(a_size, b_size);
for (size_t offset = 0; offset < min_size; offset += 16)
{
uint16_t mask = _mm_movemask_epi8(_mm_cmpeq_epi8(
_mm_loadu_si128(reinterpret_cast<const __m128i *>(a + offset)),
_mm_loadu_si128(reinterpret_cast<const __m128i *>(b + offset))));
mask = ~mask;
if (mask)
{
offset += __builtin_ctz(mask);
if (offset >= min_size)
break;
return detail::cmp(a[offset], b[offset]);
}
}
return detail::cmp(a_size, b_size);
}
/** Variant when memory regions have the same size.
* TODO Check if the compiler can optimize the previous function when the caller passes identical sizes.
*/
template <typename Char>
inline int memcmpSmallAllowOverflow15(const Char * a, const Char * b, size_t size)
{
for (size_t offset = 0; offset < size; offset += 16)
{
uint16_t mask = _mm_movemask_epi8(_mm_cmpeq_epi8(
_mm_loadu_si128(reinterpret_cast<const __m128i *>(a + offset)),
_mm_loadu_si128(reinterpret_cast<const __m128i *>(b + offset))));
mask = ~mask;
if (mask)
{
offset += __builtin_ctz(mask);
if (offset >= size)
return 0;
return detail::cmp(a[offset], b[offset]);
}
}
return 0;
}
/** Compare memory regions for equality.
*/
template <typename Char>
inline bool memequalSmallAllowOverflow15(const Char * a, size_t a_size, const Char * b, size_t b_size)
{
if (a_size != b_size)
return false;
for (size_t offset = 0; offset < a_size; offset += 16)
{
uint16_t mask = _mm_movemask_epi8(_mm_cmpeq_epi8(
_mm_loadu_si128(reinterpret_cast<const __m128i *>(a + offset)),
_mm_loadu_si128(reinterpret_cast<const __m128i *>(b + offset))));
mask = ~mask;
if (mask)
{
offset += __builtin_ctz(mask);
return offset >= a_size;
}
}
return true;
}
/** Variant when the caller knows in advance that the size is a multiple of 16.
*/
template <typename Char>
inline int memcmpSmallMultipleOf16(const Char * a, const Char * b, size_t size)
{
for (size_t offset = 0; offset < size; offset += 16)
{
uint16_t mask = _mm_movemask_epi8(_mm_cmpeq_epi8(
_mm_loadu_si128(reinterpret_cast<const __m128i *>(a + offset)),
_mm_loadu_si128(reinterpret_cast<const __m128i *>(b + offset))));
mask = ~mask;
if (mask)
{
offset += __builtin_ctz(mask);
return detail::cmp(a[offset], b[offset]);
}
}
return 0;
}
/** Variant when the size is 16 exactly.
*/
template <typename Char>
inline int memcmp16(const Char * a, const Char * b)
{
uint16_t mask = _mm_movemask_epi8(_mm_cmpeq_epi8(
_mm_loadu_si128(reinterpret_cast<const __m128i *>(a)),
_mm_loadu_si128(reinterpret_cast<const __m128i *>(b))));
mask = ~mask;
if (mask)
{
auto offset = __builtin_ctz(mask);
return detail::cmp(a[offset], b[offset]);
}
return 0;
}
/** Variant when the size is 16 exactly.
*/
inline bool memequal16(const void * a, const void * b)
{
return 0xFFFF == _mm_movemask_epi8(_mm_cmpeq_epi8(
_mm_loadu_si128(reinterpret_cast<const __m128i *>(a)),
_mm_loadu_si128(reinterpret_cast<const __m128i *>(b))));
}
/** Check whether a memory region contains only zero bytes. */
inline bool memoryIsZeroSmallAllowOverflow15(const void * data, size_t size)
{
const __m128i zero16 = _mm_setzero_si128();
for (size_t offset = 0; offset < size; offset += 16)
{
uint16_t mask = _mm_movemask_epi8(_mm_cmpeq_epi8(zero16,
_mm_loadu_si128(reinterpret_cast<const __m128i *>(reinterpret_cast<const char *>(data) + offset))));
mask = ~mask;
if (mask)
{
offset += __builtin_ctz(mask);
return offset >= size;
}
}
return true;
}
#else
#include <cstring>
template <typename Char>
inline int memcmpSmallAllowOverflow15(const Char * a, size_t a_size, const Char * b, size_t b_size)
{
return memcmp(a, b, std::min(a_size, b_size));
}
template <typename Char>
inline int memcmpSmallAllowOverflow15(const Char * a, const Char * b, size_t size)
{
return memcmp(a, b, size);
}
template <typename Char>
inline bool memequalSmallAllowOverflow15(const Char * a, size_t a_size, const Char * b, size_t b_size)
{
return a_size == b_size && 0 == memcmp(a, b, a_size);
}
template <typename Char>
inline int memcmpSmallMultipleOf16(const Char * a, const Char * b, size_t size)
{
return memcmp(a, b, size);
}
template <typename Char>
inline int memcmp16(const Char * a, const Char * b)
{
return memcmp(a, b, 16);
}
inline bool memequal16(const void * a, const void * b)
{
return 0 == memcmp(a, b, 16);
}
inline bool memoryIsZeroSmallAllowOverflow15(const void * data, size_t size)
{
const char * pos = reinterpret_cast<const char *>(data);
const char * end = pos + size;
for (; pos < end; ++pos)
if (*pos)
return false;
return true;
}
#endif
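
A minimal usage sketch for the header above. The <Common/memcmpSmall.h> include path is the one used elsewhere in this patch; the over-allocated stack buffers stand in for the right padding that PaddedPODArray-backed columns provide, since the contract only requires 15 readable bytes past the logical end of each region:

#include <cstdio>
#include <Common/memcmpSmall.h>

int main()
{
    /// Zero-filled tails double as the required overread padding.
    char a[32] = "abcdef";
    char b[32] = "abcxyz";

    /// The SSE2 path compares 16 bytes at a time; ~movemask(cmpeq) yields one
    /// bit per mismatching byte and __builtin_ctz locates the first mismatch.
    int res = memcmpSmallAllowOverflow15(a, 6, b, 6);
    printf("%d\n", res < 0 ? -1 : (res > 0 ? 1 : 0));       /// -1, since 'd' < 'x'

    printf("%d\n", memoryIsZeroSmallAllowOverflow15(a + 6, 10));    /// 1: the tail is all zeros
}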

View File

@ -1,7 +1,6 @@
#pragma once
#include <string.h>
#include <Core/Defines.h>
#ifdef __SSE2__
#include <emmintrin.h>

View File

@ -1,8 +1,9 @@
include(${ClickHouse_SOURCE_DIR}/cmake/dbms_glob_sources.cmake)
add_headers_and_sources(clickhouse_compression .)
add_library(clickhouse_compression ${LINK_MODE} ${clickhouse_compression_headers} ${clickhouse_compression_sources})
target_link_libraries(clickhouse_compression PRIVATE clickhouse_parsers clickhouse_common_io ${ZSTD_LIBRARY} ${LZ4_LIBRARY})
target_link_libraries(clickhouse_compression PRIVATE clickhouse_parsers clickhouse_common_io ${ZSTD_LIBRARY} ${LZ4_LIBRARY} ${CITYHASH_LIBRARIES})
target_include_directories(clickhouse_compression PUBLIC ${DBMS_INCLUDE_DIR})
target_include_directories(clickhouse_compression SYSTEM PUBLIC ${PCG_RANDOM_INCLUDE_DIR})
if (NOT USE_INTERNAL_LZ4_LIBRARY)
target_include_directories(clickhouse_compression SYSTEM BEFORE PRIVATE ${LZ4_INCLUDE_DIR})

View File

@ -23,8 +23,11 @@ GraphiteRollupSortedBlockInputStream::GraphiteRollupSortedBlockInputStream(
for (const auto & pattern : params.patterns)
{
max_size_of_aggregate_state = std::max(max_size_of_aggregate_state, pattern.function->sizeOfData());
max_alignment_of_aggregate_state = std::max(max_alignment_of_aggregate_state, pattern.function->alignOfData());
if (pattern.function)
{
max_size_of_aggregate_state = std::max(max_size_of_aggregate_state, pattern.function->sizeOfData());
max_alignment_of_aggregate_state = std::max(max_alignment_of_aggregate_state, pattern.function->alignOfData());
}
}
place_for_aggregate_state.reset(max_size_of_aggregate_state, max_alignment_of_aggregate_state);
@ -41,13 +44,60 @@ GraphiteRollupSortedBlockInputStream::GraphiteRollupSortedBlockInputStream(
}
const Graphite::Pattern * GraphiteRollupSortedBlockInputStream::selectPatternForPath(StringRef path) const
Graphite::RollupRule GraphiteRollupSortedBlockInputStream::selectPatternForPath(StringRef path) const
{
for (const auto & pattern : params.patterns)
if (!pattern.regexp || pattern.regexp->match(path.data, path.size))
return &pattern;
const Graphite::Pattern * first_match = &undef_pattern;
return nullptr;
for (const auto & pattern : params.patterns)
{
if (!pattern.regexp)
{
/// Default pattern
if (first_match->type == first_match->TypeUndef && pattern.type == pattern.TypeAll)
{
/// There is only default pattern for both retention and aggregation
return std::pair(&pattern, &pattern);
}
if (pattern.type != first_match->type)
{
if (first_match->type == first_match->TypeRetention)
{
return std::pair(first_match, &pattern);
}
if (first_match->type == first_match->TypeAggregation)
{
return std::pair(&pattern, first_match);
}
}
}
else if (pattern.regexp->match(path.data, path.size))
{
/// General pattern with matched path
if (pattern.type == pattern.TypeAll)
{
/// Only for not default patterns with both function and retention parameters
return std::pair(&pattern, &pattern);
}
if (first_match->type == first_match->TypeUndef)
{
first_match = &pattern;
continue;
}
if (pattern.type != first_match->type)
{
if (first_match->type == first_match->TypeRetention)
{
return std::pair(first_match, &pattern);
}
if (first_match->type == first_match->TypeAggregation)
{
return std::pair(&pattern, first_match);
}
}
}
}
return {nullptr, nullptr};
}
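
The net effect of the new return type: instead of a single pattern, path lookup now yields a (retention, aggregation) pair, so a retention-only pattern and an aggregation-only pattern can be combined into one rollup rule. A simplified standalone model of that combination logic (the Pattern struct and its matching flag are stand-ins, not the real ClickHouse types, and the real function additionally gives the trailing default pattern special treatment):

#include <utility>
#include <vector>

enum class PatternType { Retention, Aggregation, All };

struct Pattern
{
    bool matches = false;           /// stand-in for "regexp matched the path"
    PatternType type = PatternType::All;
};

/// {retention half, aggregation half}
using RollupRule = std::pair<const Pattern *, const Pattern *>;

/// A matching full pattern supplies both halves at once; a matching partial
/// pattern is held until a partial pattern of the complementary type
/// completes the pair.
RollupRule selectRule(const std::vector<Pattern> & patterns)
{
    const Pattern * first_match = nullptr;
    for (const auto & p : patterns)
    {
        if (!p.matches)
            continue;
        if (p.type == PatternType::All)
            return {&p, &p};
        if (!first_match)
            first_match = &p;
        else if (p.type != first_match->type)
            return first_match->type == PatternType::Retention
                ? RollupRule{first_match, &p}
                : RollupRule{&p, first_match};
    }
    return {nullptr, nullptr};
}

int main()
{
    std::vector<Pattern> patterns = {
        {true, PatternType::Retention},
        {true, PatternType::Aggregation},
    };
    RollupRule rule = selectRule(patterns);
    return rule.first && rule.second ? 0 : 1;   /// pair combined from two partial patterns
}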
@ -142,14 +192,15 @@ void GraphiteRollupSortedBlockInputStream::merge(MutableColumns & merged_columns
if (started_rows)
accumulateRow(current_subgroup_newest_row);
const Graphite::Pattern * next_pattern = current_pattern;
Graphite::RollupRule next_rule = current_rule;
if (new_path)
next_pattern = selectPatternForPath(next_path);
next_rule = selectPatternForPath(next_path);
const Graphite::RetentionPattern * retention_pattern = std::get<0>(next_rule);
time_t next_time_rounded;
if (next_pattern)
if (retention_pattern)
{
UInt32 precision = selectPrecision(next_pattern->retentions, next_row_time);
UInt32 precision = selectPrecision(retention_pattern->retentions, next_row_time);
next_time_rounded = roundTimeToPrecision(date_lut, next_row_time, precision);
}
else
@ -177,7 +228,7 @@ void GraphiteRollupSortedBlockInputStream::merge(MutableColumns & merged_columns
/// At this point previous row has been fully processed, so we can advance the loop
/// (substitute current_* values for next_*, advance the cursor).
startNextGroup(merged_columns, next_cursor, next_pattern);
startNextGroup(merged_columns, next_cursor, next_rule);
++started_rows;
current_time_rounded = next_time_rounded;
@ -229,8 +280,10 @@ void GraphiteRollupSortedBlockInputStream::merge(MutableColumns & merged_columns
template <typename TSortCursor>
void GraphiteRollupSortedBlockInputStream::startNextGroup(MutableColumns & merged_columns, TSortCursor & cursor,
const Graphite::Pattern * next_pattern)
Graphite::RollupRule next_rule)
{
const Graphite::AggregationPattern * aggregation_pattern = std::get<1>(next_rule);
/// Copy unmodified column values (including path column).
for (size_t i = 0, size = unmodified_column_numbers.size(); i < size; ++i)
{
@ -238,13 +291,13 @@ void GraphiteRollupSortedBlockInputStream::startNextGroup(MutableColumns & merge
merged_columns[j]->insertFrom(*cursor->all_columns[j], cursor->pos);
}
if (next_pattern)
if (aggregation_pattern)
{
next_pattern->function->create(place_for_aggregate_state.data());
aggregation_pattern->function->create(place_for_aggregate_state.data());
aggregate_state_created = true;
}
current_pattern = next_pattern;
current_rule = next_rule;
}
@ -255,10 +308,11 @@ void GraphiteRollupSortedBlockInputStream::finishCurrentGroup(MutableColumns & m
merged_columns[version_column_num]->insertFrom(
*(*current_subgroup_newest_row.columns)[version_column_num], current_subgroup_newest_row.row_num);
const Graphite::AggregationPattern * aggregation_pattern = std::get<1>(current_rule);
if (aggregate_state_created)
{
current_pattern->function->insertResultInto(place_for_aggregate_state.data(), *merged_columns[value_column_num]);
current_pattern->function->destroy(place_for_aggregate_state.data());
aggregation_pattern->function->insertResultInto(place_for_aggregate_state.data(), *merged_columns[value_column_num]);
aggregation_pattern->function->destroy(place_for_aggregate_state.data());
aggregate_state_created = false;
}
else
@ -269,8 +323,9 @@ void GraphiteRollupSortedBlockInputStream::finishCurrentGroup(MutableColumns & m
void GraphiteRollupSortedBlockInputStream::accumulateRow(RowRef & row)
{
const Graphite::AggregationPattern * aggregation_pattern = std::get<1>(current_rule);
if (aggregate_state_created)
current_pattern->function->add(place_for_aggregate_state.data(), &(*row.columns)[value_column_num], row.row_num, nullptr);
aggregation_pattern->function->add(place_for_aggregate_state.data(), &(*row.columns)[value_column_num], row.row_num, nullptr);
}
}

View File

@ -27,11 +27,24 @@ namespace DB
*
* Each row in a table corresponds to one value of one sensor.
*
* A pattern should contain a function, a retention scheme, or both. The order of patterns matters as well:
* * aggregation-only OR retention-only patterns should come first;
* * then full patterns with both aggregation AND retention;
* * the default pattern without a regexp must be the last one.
*
* Rollup rules are specified in the following way:
*
* pattern
* regexp
* function
* pattern
* regexp
* age -> precision
* age -> precision
* ...
* pattern
* regexp
* function
* age -> precision
* age -> precision
* ...
@ -54,6 +67,10 @@ namespace DB
*
* <graphite_rollup>
* <pattern>
* <regexp>\.max$</regexp>
* <function>max</function>
* </pattern>
* <pattern>
* <regexp>click_cost</regexp>
* <function>any</function>
* <retention>
@ -98,9 +115,12 @@ namespace Graphite
std::shared_ptr<OptimizedRegularExpression> regexp;
AggregateFunctionPtr function;
Retentions retentions; /// Must be ordered by 'age' descending.
enum { TypeUndef, TypeRetention, TypeAggregation, TypeAll } type = TypeAll; /// The type of defined pattern, filled automatically
};
using Patterns = std::vector<Pattern>;
using RetentionPattern = Pattern;
using AggregationPattern = Pattern;
struct Params
{
@ -110,6 +130,8 @@ namespace Graphite
String version_column_name;
Graphite::Patterns patterns;
};
using RollupRule = std::pair<const RetentionPattern *, const AggregationPattern *>;
}
/** Merges several sorted streams into one.
@ -135,7 +157,7 @@ public:
~GraphiteRollupSortedBlockInputStream() override
{
if (aggregate_state_created)
current_pattern->function->destroy(place_for_aggregate_state.data());
std::get<1>(current_rule)->function->destroy(place_for_aggregate_state.data());
}
protected:
@ -186,11 +208,18 @@ private:
time_t current_time = 0;
time_t current_time_rounded = 0;
const Graphite::Pattern * current_pattern = nullptr;
Graphite::RollupRule current_rule = {nullptr, nullptr};
AlignedBuffer place_for_aggregate_state;
bool aggregate_state_created = false; /// Invariant: if true then current_pattern is not NULL.
bool aggregate_state_created = false; /// Invariant: if true then current_rule is not NULL.
const Graphite::Pattern * selectPatternForPath(StringRef path) const;
const Graphite::Pattern undef_pattern =
{ /// temporary empty pattern for selectPatternForPath
nullptr,
nullptr,
DB::Graphite::Retentions(),
undef_pattern.TypeUndef,
};
Graphite::RollupRule selectPatternForPath(StringRef path) const;
UInt32 selectPrecision(const Graphite::Retentions & retentions, time_t time) const;
@ -198,7 +227,7 @@ private:
/// Insert the values into the resulting columns, which will not be changed in the future.
template <typename TSortCursor>
void startNextGroup(MutableColumns & merged_columns, TSortCursor & cursor, const Graphite::Pattern * next_pattern);
void startNextGroup(MutableColumns & merged_columns, TSortCursor & cursor, Graphite::RollupRule next_rule);
/// Insert the calculated `time`, `value`, `version` values into the resulting columns by the last group of rows.
void finishCurrentGroup(MutableColumns & merged_columns);

View File

@ -262,8 +262,10 @@ protected:
/** Text serialization with escaping but without quoting.
*/
public: // used somewhere in arcadia
virtual void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const = 0;
protected:
virtual void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const = 0;
/** Text serialization as a literal that may be inserted into a query.

View File

@ -6,6 +6,7 @@
#include <Interpreters/executeQuery.h>
#include <Common/isLocalAddress.h>
#include <ext/range.h>
#include <common/logger_useful.h>
#include "DictionarySourceFactory.h"
#include "DictionaryStructure.h"
#include "ExternalQueryBuilder.h"
@ -155,6 +156,7 @@ bool ClickHouseDictionarySource::isModified() const
if (!invalidate_query.empty())
{
auto response = doInvalidateQuery(invalidate_query);
LOG_TRACE(log, "Invalidate query has returned: " << response << ", previous value: " << invalidate_query_response);
if (invalidate_query_response == response)
return false;
invalidate_query_response = response;
@ -182,6 +184,7 @@ BlockInputStreamPtr ClickHouseDictionarySource::createStreamForSelectiveLoad(con
std::string ClickHouseDictionarySource::doInvalidateQuery(const std::string & request) const
{
LOG_TRACE(log, "Performing invalidate query");
if (is_local)
{
Context query_context = context;

View File

@ -1,6 +1,7 @@
#pragma once
#include <memory>
#include <Poco/Logger.h>
#include <Client/ConnectionPoolWithFailover.h>
#include <Interpreters/Context.h>
#include "DictionaryStructure.h"
@ -70,6 +71,7 @@ private:
const bool is_local;
ConnectionPoolWithFailoverPtr pool;
const std::string load_all_query;
Poco::Logger * log = &Poco::Logger::get("ClickHouseDictionarySource");
};
}

View File

@ -1,8 +1,11 @@
#include "readInvalidateQuery.h"
#include <DataStreams/IBlockInputStream.h>
#include <IO/WriteBufferFromString.h>
namespace DB
{
namespace ErrorCodes
{
extern const int TOO_MANY_COLUMNS;
@ -13,7 +16,6 @@ namespace ErrorCodes
std::string readInvalidateQuery(IBlockInputStream & block_input_stream)
{
block_input_stream.readPrefix();
std::string response;
Block block = block_input_stream.read();
if (!block)
@ -29,18 +31,16 @@ std::string readInvalidateQuery(IBlockInputStream & block_input_stream)
if (rows > 1)
throw Exception("Expected single row in resultset, got at least " + std::to_string(rows), ErrorCodes::TOO_MANY_ROWS);
auto column = block.getByPosition(0).column;
response = column->getDataAt(0).toString();
WriteBufferFromOwnString out;
auto & column_type = block.getByPosition(0);
column_type.type->serializeAsTextQuoted(*column_type.column->convertToFullColumnIfConst(), 0, out, FormatSettings());
while ((block = block_input_stream.read()))
{
if (block.rows() > 0)
throw Exception("Expected single row in resultset, got at least " + std::to_string(rows + 1), ErrorCodes::TOO_MANY_ROWS);
}
block_input_stream.readSuffix();
return response;
return out.str();
}
}
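
The switch from column->getDataAt(0) to serializeAsTextQuoted() makes the stored invalidate-query response type-aware, so for example the string '1' and the number 1 no longer produce the same bytes. A toy model of the quoting effect (quoteString below is a stand-in, not the real IDataType serialization):

#include <cstdio>
#include <string>

/// Stand-in for serializeAsTextQuoted on a String column: quotes and escapes,
/// whereas a numeric column would keep its bare text form.
std::string quoteString(const std::string & s)
{
    std::string out = "'";
    for (char c : s)
    {
        if (c == '\'' || c == '\\')
            out += '\\';
        out += c;
    }
    return out + "'";
}

int main()
{
    /// Previously both values yielded the raw bytes "1" and compared equal.
    printf("string: %s, number: %s\n", quoteString("1").c_str(), "1");  /// '1' vs 1
}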

View File

@ -1,12 +1,12 @@
#pragma once
#include <string>
class IBlockInputStream;
namespace DB
{
// Using in MySQLDictionarySource and XDBCDictionarySource after processing invalidate_query
class IBlockInputStream;
/// Used in MySQLDictionarySource and XDBCDictionarySource after processing invalidate_query.
std::string readInvalidateQuery(IBlockInputStream & block_input_stream);
}

View File

@ -238,29 +238,29 @@ using ConstAggregateDataPtr = const char *;
class ProtobufWriter
{
public:
bool writeNumber(Int8 value) { return false; }
bool writeNumber(UInt8 value) { return false; }
bool writeNumber(Int16 value) { return false; }
bool writeNumber(UInt16 value) { return false; }
bool writeNumber(Int32 value) { return false; }
bool writeNumber(UInt32 value) { return false; }
bool writeNumber(Int64 value) { return false; }
bool writeNumber(UInt64 value) { return false; }
bool writeNumber(UInt128 value) { return false; }
bool writeNumber(Float32 value) { return false; }
bool writeNumber(Float64 value) { return false; }
bool writeString(const StringRef & value) { return false; }
void prepareEnumMapping(const std::vector<std::pair<std::string, Int8>> & name_value_pairs) {}
void prepareEnumMapping(const std::vector<std::pair<std::string, Int16>> & name_value_pairs) {}
bool writeEnum(Int8 value) { return false; }
bool writeEnum(Int16 value) { return false; }
bool writeUUID(const UUID & value) { return false; }
bool writeDate(DayNum date) { return false; }
bool writeDateTime(time_t tm) { return false; }
bool writeDecimal(Decimal32 decimal, UInt32 scale) { return false; }
bool writeDecimal(Decimal64 decimal, UInt32 scale) { return false; }
bool writeDecimal(const Decimal128 & decimal, UInt32 scale) { return false; }
bool writeAggregateFunction(const AggregateFunctionPtr & function, ConstAggregateDataPtr place) { return false; }
bool writeNumber(Int8 /* value */) { return false; }
bool writeNumber(UInt8 /* value */) { return false; }
bool writeNumber(Int16 /* value */) { return false; }
bool writeNumber(UInt16 /* value */) { return false; }
bool writeNumber(Int32 /* value */) { return false; }
bool writeNumber(UInt32 /* value */) { return false; }
bool writeNumber(Int64 /* value */) { return false; }
bool writeNumber(UInt64 /* value */) { return false; }
bool writeNumber(UInt128 /* value */) { return false; }
bool writeNumber(Float32 /* value */) { return false; }
bool writeNumber(Float64 /* value */) { return false; }
bool writeString(const StringRef & /* value */) { return false; }
void prepareEnumMapping(const std::vector<std::pair<std::string, Int8>> & /* name_value_pairs */) {}
void prepareEnumMapping(const std::vector<std::pair<std::string, Int16>> & /* name_value_pairs */) {}
bool writeEnum(Int8 /* value */) { return false; }
bool writeEnum(Int16 /* value */) { return false; }
bool writeUUID(const UUID & /* value */) { return false; }
bool writeDate(DayNum /* date */) { return false; }
bool writeDateTime(time_t /* tm */) { return false; }
bool writeDecimal(Decimal32 /* decimal */, UInt32 /* scale */) { return false; }
bool writeDecimal(Decimal64 /* decimal */, UInt32 /* scale */) { return false; }
bool writeDecimal(const Decimal128 & /* decimal */, UInt32 /* scale */) { return false; }
bool writeAggregateFunction(const AggregateFunctionPtr & /* function */, ConstAggregateDataPtr /* place */) { return false; }
};
}
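
Commenting out the parameter names is the usual way to keep a stub's signature self-documenting while silencing -Wunused-parameter warnings. For comparison, a sketch of an equivalent C++17 attribute form (not part of this patch):

struct Stub
{
    bool writeNumber(int /* value */) { return false; }             /// style used in this patch
    bool writeEnum([[maybe_unused]] int value) { return false; }    /// C++17 attribute form
};

int main()
{
    Stub s;
    return s.writeNumber(1) || s.writeEnum(2) ? 1 : 0;
}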

View File

@ -11,11 +11,11 @@ add_library(clickhouse_functions ${LINK_MODE} ${clickhouse_functions_sources})
target_link_libraries(clickhouse_functions
PUBLIC
dbms
PRIVATE
clickhouse_dictionaries
dbms
${CONSISTENT_HASHING_LIBRARY}
consistent-hashing-sumbur
${CITYHASH_LIBRARIES}
${FARMHASH_LIBRARIES}
${METROHASH_LIBRARIES}
murmurhash

View File

@ -1,5 +1,6 @@
#pragma once
#include <cstring>
#include <Common/memcmpSmall.h>
#include <Columns/ColumnString.h>
#include <Functions/FunctionFactory.h>
@ -38,11 +39,9 @@ struct EmptyImpl
static void vector_fixed_to_vector(const ColumnString::Chars & data, size_t n, PaddedPODArray<UInt8> & res)
{
std::vector<char> empty_chars(n);
size_t size = data.size() / n;
for (size_t i = 0; i < size; ++i)
res[i] = negative ^ (0 == memcmp(&data[i * n], empty_chars.data(), n));
res[i] = negative ^ memoryIsZeroSmallAllowOverflow15(data.data() + i * n, n);
}
static void array(const ColumnString::Offsets & offsets, PaddedPODArray<UInt8> & res)

View File

@ -0,0 +1,25 @@
#include <Functions/FunctionFactory.h>
#include <Functions/FunctionsBitmap.h>
namespace DB
{
void registerFunctionsBitmap(FunctionFactory & factory)
{
factory.registerFunction<FunctionBitmapBuild>();
factory.registerFunction<FunctionBitmapToArray>();
factory.registerFunction<FunctionBitmapSelfCardinality>();
factory.registerFunction<FunctionBitmapAndCardinality>();
factory.registerFunction<FunctionBitmapOrCardinality>();
factory.registerFunction<FunctionBitmapXorCardinality>();
factory.registerFunction<FunctionBitmapAndnotCardinality>();
factory.registerFunction<FunctionBitmapAnd>();
factory.registerFunction<FunctionBitmapOr>();
factory.registerFunction<FunctionBitmapXor>();
factory.registerFunction<FunctionBitmapAndnot>();
}
}

View File

@ -0,0 +1,593 @@
#pragma once
#include <AggregateFunctions/AggregateFunctionFactory.h>
#include <AggregateFunctions/AggregateFunctionGroupBitmapData.h>
#include <Columns/ColumnAggregateFunction.h>
#include <Columns/ColumnArray.h>
#include <Columns/ColumnConst.h>
#include <Columns/ColumnFunction.h>
#include <Columns/ColumnVector.h>
#include <DataTypes/DataTypeAggregateFunction.h>
#include <DataTypes/DataTypeArray.h>
#include <DataTypes/DataTypesNumber.h>
#include <Functions/FunctionHelpers.h>
#include <Functions/IFunction.h>
#include <Common/typeid_cast.h>
namespace DB
{
namespace ErrorCodes
{
extern const int LOGICAL_ERROR;
extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH;
}
/** Bitmap functions.
* Build a bitmap from an integer array:
* bitmapBuild: integer[] -> bitmap
*
* Convert a bitmap to an integer array:
* bitmapToArray: bitmap -> integer[]
*
* AND of two bitmaps:
* bitmapAnd: bitmap,bitmap -> bitmap
*
* OR of two bitmaps:
* bitmapOr: bitmap,bitmap -> bitmap
*
* XOR of two bitmaps:
* bitmapXor: bitmap,bitmap -> bitmap
*
* ANDNOT of two bitmaps:
* bitmapAndnot: bitmap,bitmap -> bitmap
*
* Return bitmap cardinality:
* bitmapCardinality: bitmap -> integer
*
* AND of two bitmaps, returning the cardinality:
* bitmapAndCardinality: bitmap,bitmap -> integer
*
* OR of two bitmaps, returning the cardinality:
* bitmapOrCardinality: bitmap,bitmap -> integer
*
* XOR of two bitmaps, returning the cardinality:
* bitmapXorCardinality: bitmap,bitmap -> integer
*
* ANDNOT of two bitmaps, returning the cardinality:
* bitmapAndnotCardinality: bitmap,bitmap -> integer
*/
template <typename Name>
class FunctionBitmapBuildImpl : public IFunction
{
public:
static constexpr auto name = Name::name;
static FunctionPtr create(const Context &) { return std::make_shared<FunctionBitmapBuildImpl>(); }
String getName() const override { return name; }
bool isVariadic() const override { return false; }
size_t getNumberOfArguments() const override { return 1; }
DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
{
if (arguments[0]->onlyNull())
return arguments[0];
auto array_type = typeid_cast<const DataTypeArray *>(arguments[0].get());
if (!array_type)
throw Exception(
"First argument for function " + getName() + " must be an array but it has type " + arguments[0]->getName() + ".",
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
auto nested_type = array_type->getNestedType();
DataTypes argument_types = {nested_type};
Array params_row;
AggregateFunctionPtr bitmap_function
= AggregateFunctionFactory::instance().get(AggregateFunctionGroupBitmapData<UInt32>::name(), argument_types, params_row);
return std::make_shared<DataTypeAggregateFunction>(bitmap_function, argument_types, params_row);
}
bool useDefaultImplementationForConstants() const override { return true; }
void executeImpl(Block & block, const ColumnNumbers & arguments, size_t result, size_t /* input_rows_count */) override
{
const IDataType * from_type = block.getByPosition(arguments[0]).type.get();
auto array_type = typeid_cast<const DataTypeArray *>(from_type);
auto nested_type = array_type->getNestedType();
DataTypes argument_types = {nested_type};
WhichDataType which(nested_type);
if (which.isUInt8())
executeBitmapData<UInt8>(block, argument_types, arguments, result);
else if (which.isUInt16())
executeBitmapData<UInt16>(block, argument_types, arguments, result);
else if (which.isUInt32())
executeBitmapData<UInt32>(block, argument_types, arguments, result);
else if (which.isUInt64())
executeBitmapData<UInt64>(block, argument_types, arguments, result);
else
throw Exception(
"Unexpected type " + from_type->getName() + " of argument of function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
}
private:
template <typename T>
void executeBitmapData(Block & block, DataTypes & argument_types, const ColumnNumbers & arguments, size_t result)
{
// input data
const ColumnArray * array = typeid_cast<const ColumnArray *>(block.getByPosition(arguments[0]).column.get());
ColumnPtr mapped = array->getDataPtr();
const ColumnArray::Offsets & offsets = array->getOffsets();
const ColumnVector<T> * column = checkAndGetColumn<ColumnVector<T>>(&*mapped);
const typename ColumnVector<T>::Container & input_data = column->getData();
// output data
Array params_row;
AggregateFunctionPtr bitmap_function
= AggregateFunctionFactory::instance().get(AggregateFunctionGroupBitmapData<UInt32>::name(), argument_types, params_row);
auto col_to = ColumnAggregateFunction::create(bitmap_function);
col_to->reserve(offsets.size());
size_t pos = 0;
for (size_t i = 0; i < offsets.size(); ++i)
{
col_to->insertDefault();
AggregateFunctionGroupBitmapData<T> & bitmap_data
= *reinterpret_cast<AggregateFunctionGroupBitmapData<T> *>(col_to->getData()[i]);
for (; pos < offsets[i]; ++pos)
{
bitmap_data.rbs.add(input_data[pos]);
}
}
block.getByPosition(result).column = std::move(col_to);
}
};
template <typename Name>
class FunctionBitmapToArrayImpl : public IFunction
{
public:
static constexpr auto name = Name::name;
static FunctionPtr create(const Context &) { return std::make_shared<FunctionBitmapToArrayImpl>(); }
String getName() const override { return name; }
bool isVariadic() const override { return false; }
size_t getNumberOfArguments() const override { return 1; }
DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
{
const DataTypeAggregateFunction * bitmap_type = typeid_cast<const DataTypeAggregateFunction *>(arguments[0].get());
if (!(bitmap_type && bitmap_type->getFunctionName() == AggregateFunctionGroupBitmapData<UInt32>::name()))
throw Exception(
"First argument for function " + getName() + " must be an bitmap but it has type " + arguments[0]->getName() + ".",
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
const DataTypePtr data_type = bitmap_type->getArgumentsDataTypes()[0];
return std::make_shared<DataTypeArray>(data_type);
}
bool useDefaultImplementationForConstants() const override { return true; }
void executeImpl(Block & block, const ColumnNumbers & arguments, size_t result, size_t input_rows_count) override
{
// input data
const auto & return_type = block.getByPosition(result).type;
auto res_ptr = return_type->createColumn();
ColumnArray & res = static_cast<ColumnArray &>(*res_ptr);
IColumn & res_data = res.getData();
ColumnArray::Offsets & res_offsets = res.getOffsets();
const IDataType * from_type = block.getByPosition(arguments[0]).type.get();
const DataTypeAggregateFunction * aggr_type = typeid_cast<const DataTypeAggregateFunction *>(from_type);
WhichDataType which(aggr_type->getArgumentsDataTypes()[0]);
if (which.isUInt8())
executeIntType<UInt8>(block, arguments, input_rows_count, res_data, res_offsets);
else if (which.isUInt16())
executeIntType<UInt16>(block, arguments, input_rows_count, res_data, res_offsets);
else if (which.isUInt32())
executeIntType<UInt32>(block, arguments, input_rows_count, res_data, res_offsets);
else if (which.isUInt64())
executeIntType<UInt64>(block, arguments, input_rows_count, res_data, res_offsets);
else
throw Exception(
"Unexpected type " + from_type->getName() + " of argument of function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
block.getByPosition(result).column = std::move(res_ptr);
}
private:
using ToType = UInt64;
template <typename T>
void executeIntType(
Block & block, const ColumnNumbers & arguments, size_t input_rows_count, IColumn & res_data_col, ColumnArray::Offsets & res_offsets)
const
{
const ColumnAggregateFunction * column
= typeid_cast<const ColumnAggregateFunction *>(block.getByPosition(arguments[0]).column.get());
PaddedPODArray<T> & res_data = typeid_cast<ColumnVector<T> &>(res_data_col).getData();
ColumnArray::Offset res_offset = 0;
for (size_t i = 0; i < input_rows_count; ++i)
{
const AggregateFunctionGroupBitmapData<T> & bd1
= *reinterpret_cast<const AggregateFunctionGroupBitmapData<T> *>(column->getData()[i]);
UInt64 count = bd1.rbs.rb_to_array(res_data);
res_offset += count;
res_offsets.emplace_back(res_offset);
}
}
};
template <typename Name>
class FunctionBitmapSelfCardinalityImpl : public IFunction
{
public:
static constexpr auto name = Name::name;
static FunctionPtr create(const Context &) { return std::make_shared<FunctionBitmapSelfCardinalityImpl>(); }
String getName() const override { return name; }
bool isVariadic() const override { return false; }
size_t getNumberOfArguments() const override { return 1; }
DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
{
auto bitmap_type = typeid_cast<const DataTypeAggregateFunction *>(arguments[0].get());
if (!(bitmap_type && bitmap_type->getFunctionName() == AggregateFunctionGroupBitmapData<UInt32>::name()))
throw Exception(
"First argument for function " + getName() + " must be an bitmap but it has type " + arguments[0]->getName() + ".",
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
return std::make_shared<DataTypeNumber<ToType>>();
}
bool useDefaultImplementationForConstants() const override { return true; }
void executeImpl(Block & block, const ColumnNumbers & arguments, size_t result, size_t input_rows_count) override
{
auto col_to = ColumnVector<ToType>::create(input_rows_count);
typename ColumnVector<ToType>::Container & vec_to = col_to->getData();
const IDataType * from_type = block.getByPosition(arguments[0]).type.get();
const DataTypeAggregateFunction * aggr_type = typeid_cast<const DataTypeAggregateFunction *>(from_type);
WhichDataType which(aggr_type->getArgumentsDataTypes()[0]);
if (which.isUInt8())
executeIntType<UInt8>(block, arguments, input_rows_count, vec_to);
else if (which.isUInt16())
executeIntType<UInt16>(block, arguments, input_rows_count, vec_to);
else if (which.isUInt32())
executeIntType<UInt32>(block, arguments, input_rows_count, vec_to);
else if (which.isUInt64())
executeIntType<UInt64>(block, arguments, input_rows_count, vec_to);
else
throw Exception(
"Unexpected type " + from_type->getName() + " of argument of function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
block.getByPosition(result).column = std::move(col_to);
}
private:
using ToType = UInt64;
template <typename T>
void executeIntType(
Block & block, const ColumnNumbers & arguments, size_t input_rows_count, typename ColumnVector<ToType>::Container & vec_to)
{
const ColumnAggregateFunction * column
= typeid_cast<const ColumnAggregateFunction *>(block.getByPosition(arguments[0]).column.get());
for (size_t i = 0; i < input_rows_count; ++i)
{
const AggregateFunctionGroupBitmapData<T> & bd1
= *reinterpret_cast<const AggregateFunctionGroupBitmapData<T> *>(column->getData()[i]);
vec_to[i] = bd1.rbs.size();
}
}
};
template <typename T>
struct BitmapAndCardinalityImpl
{
using ReturnType = UInt64;
static UInt64 apply(const AggregateFunctionGroupBitmapData<T> & bd1, const AggregateFunctionGroupBitmapData<T> & bd2)
{
/// Equivalent to roaring_bitmap_and_cardinality(rb1, rb2).
return bd1.rbs.rb_and_cardinality(bd2.rbs);
}
};
template <typename T>
struct BitmapOrCardinalityImpl
{
using ReturnType = UInt64;
static UInt64 apply(const AggregateFunctionGroupBitmapData<T> & bd1, const AggregateFunctionGroupBitmapData<T> & bd2)
{
/// Equivalent to roaring_bitmap_or_cardinality(rb1, rb2).
return bd1.rbs.rb_or_cardinality(bd2.rbs);
}
};
template <typename T>
struct BitmapXorCardinalityImpl
{
using ReturnType = UInt64;
static UInt64 apply(const AggregateFunctionGroupBitmapData<T> & bd1, const AggregateFunctionGroupBitmapData<T> & bd2)
{
/// Equivalent to roaring_bitmap_xor_cardinality(rb1, rb2).
return bd1.rbs.rb_xor_cardinality(bd2.rbs);
}
};
template <typename T>
struct BitmapAndnotCardinalityImpl
{
using ReturnType = UInt64;
static UInt64 apply(const AggregateFunctionGroupBitmapData<T> & bd1, const AggregateFunctionGroupBitmapData<T> & bd2)
{
/// Equivalent to roaring_bitmap_andnot_cardinality(rb1, rb2).
return bd1.rbs.rb_andnot_cardinality(bd2.rbs);
}
};
template <template <typename> class Impl, typename Name>
class FunctionBitmapCardinality : public IFunction
{
public:
static constexpr auto name = Name::name;
static FunctionPtr create(const Context &) { return std::make_shared<FunctionBitmapCardinality>(); }
String getName() const override { return name; }
bool isVariadic() const override { return false; }
size_t getNumberOfArguments() const override { return 2; }
DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
{
auto bitmap_type0 = typeid_cast<const DataTypeAggregateFunction *>(arguments[0].get());
if (!(bitmap_type0 && bitmap_type0->getFunctionName() == AggregateFunctionGroupBitmapData<UInt32>::name()))
throw Exception(
"First argument for function " + getName() + " must be an bitmap but it has type " + arguments[0]->getName() + ".",
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
auto bitmap_type1 = typeid_cast<const DataTypeAggregateFunction *>(arguments[1].get());
if (!(bitmap_type1 && bitmap_type1->getFunctionName() == AggregateFunctionGroupBitmapData<UInt32>::name()))
throw Exception(
"Second argument for function " + getName() + " must be an bitmap but it has type " + arguments[1]->getName() + ".",
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
return std::make_shared<DataTypeNumber<ToType>>();
}
bool useDefaultImplementationForConstants() const override { return true; }
void executeImpl(Block & block, const ColumnNumbers & arguments, size_t result, size_t input_rows_count) override
{
auto col_to = ColumnVector<ToType>::create(input_rows_count);
typename ColumnVector<ToType>::Container & vec_to = col_to->getData();
const IDataType * from_type = block.getByPosition(arguments[0]).type.get();
const DataTypeAggregateFunction * aggr_type = typeid_cast<const DataTypeAggregateFunction *>(from_type);
WhichDataType which(aggr_type->getArgumentsDataTypes()[0]);
if (which.isUInt8())
executeIntType<UInt8>(block, arguments, input_rows_count, vec_to);
else if (which.isUInt16())
executeIntType<UInt16>(block, arguments, input_rows_count, vec_to);
else if (which.isUInt32())
executeIntType<UInt32>(block, arguments, input_rows_count, vec_to);
else if (which.isUInt64())
executeIntType<UInt64>(block, arguments, input_rows_count, vec_to);
else
throw Exception(
"Unexpected type " + from_type->getName() + " of argument of function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
block.getByPosition(result).column = std::move(col_to);
}
private:
using ToType = UInt64;
template <typename T>
void executeIntType(
Block & block, const ColumnNumbers & arguments, size_t input_rows_count, typename ColumnVector<ToType>::Container & vec_to)
{
const ColumnAggregateFunction * columns[2];
for (size_t i = 0; i < 2; ++i)
columns[i] = typeid_cast<const ColumnAggregateFunction *>(block.getByPosition(arguments[i]).column.get());
for (size_t i = 0; i < input_rows_count; ++i)
{
const AggregateFunctionGroupBitmapData<T> & bd1
= *reinterpret_cast<const AggregateFunctionGroupBitmapData<T> *>(columns[0]->getData()[i]);
const AggregateFunctionGroupBitmapData<T> & bd2
= *reinterpret_cast<const AggregateFunctionGroupBitmapData<T> *>(columns[1]->getData()[i]);
vec_to[i] = Impl<T>::apply(bd1, bd2);
}
}
};
template <typename T>
struct BitmapAndImpl
{
static void apply(AggregateFunctionGroupBitmapData<T> & toBd, const AggregateFunctionGroupBitmapData<T> & bd2)
{
toBd.rbs.rb_and(bd2.rbs);
}
};
template <typename T>
struct BitmapOrImpl
{
static void apply(AggregateFunctionGroupBitmapData<T> & toBd, const AggregateFunctionGroupBitmapData<T> & bd2)
{
toBd.rbs.rb_or(bd2.rbs);
}
};
template <typename T>
struct BitmapXorImpl
{
static void apply(AggregateFunctionGroupBitmapData<T> & toBd, const AggregateFunctionGroupBitmapData<T> & bd2)
{
toBd.rbs.rb_xor(bd2.rbs);
}
};
template <typename T>
struct BitmapAndnotImpl
{
static void apply(AggregateFunctionGroupBitmapData<T> & toBd, const AggregateFunctionGroupBitmapData<T> & bd2)
{
toBd.rbs.rb_andnot(bd2.rbs);
}
};
template <template <typename> class Impl, typename Name>
class FunctionBitmap : public IFunction
{
public:
static constexpr auto name = Name::name;
static FunctionPtr create(const Context &) { return std::make_shared<FunctionBitmap>(); }
String getName() const override { return name; }
bool isVariadic() const override { return false; }
size_t getNumberOfArguments() const override { return 2; }
DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
{
auto bitmap_type0 = typeid_cast<const DataTypeAggregateFunction *>(arguments[0].get());
if (!(bitmap_type0 && bitmap_type0->getFunctionName() == AggregateFunctionGroupBitmapData<UInt32>::name()))
throw Exception(
"First argument for function " + getName() + " must be an bitmap but it has type " + arguments[0]->getName() + ".",
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
auto bitmap_type1 = typeid_cast<const DataTypeAggregateFunction *>(arguments[1].get());
if (!(bitmap_type1 && bitmap_type1->getFunctionName() == AggregateFunctionGroupBitmapData<UInt32>::name()))
throw Exception(
"Second argument for function " + getName() + " must be an bitmap but it has type " + arguments[1]->getName() + ".",
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
return arguments[0];
}
bool useDefaultImplementationForConstants() const override { return true; }
void executeImpl(Block & block, const ColumnNumbers & arguments, size_t result, size_t input_rows_count) override
{
const IDataType * from_type = block.getByPosition(arguments[0]).type.get();
const DataTypeAggregateFunction * aggr_type = typeid_cast<const DataTypeAggregateFunction *>(from_type);
WhichDataType which(aggr_type->getArgumentsDataTypes()[0]);
if (which.isUInt8())
executeBitmapData<UInt8>(block, arguments, result, input_rows_count);
else if (which.isUInt16())
executeBitmapData<UInt16>(block, arguments, result, input_rows_count);
else if (which.isUInt32())
executeBitmapData<UInt32>(block, arguments, result, input_rows_count);
else if (which.isUInt64())
executeBitmapData<UInt64>(block, arguments, result, input_rows_count);
else
throw Exception(
"Unexpected type " + from_type->getName() + " of argument of function " + getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
}
private:
template <typename T>
void executeBitmapData(Block & block, const ColumnNumbers & arguments, size_t result, size_t input_rows_count)
{
const ColumnAggregateFunction * columns[2];
for (size_t i = 0; i < 2; ++i)
columns[i] = typeid_cast<const ColumnAggregateFunction *>(block.getByPosition(arguments[i]).column.get());
auto col_to = ColumnAggregateFunction::create(columns[0]->getAggregateFunction());
col_to->reserve(input_rows_count);
for (size_t i = 0; i < input_rows_count; ++i)
{
col_to->insertFrom(columns[0]->getData()[i]);
AggregateFunctionGroupBitmapData<T> & toBd = *reinterpret_cast<AggregateFunctionGroupBitmapData<T> *>(col_to->getData()[i]);
const AggregateFunctionGroupBitmapData<T> & bd2
= *reinterpret_cast<const AggregateFunctionGroupBitmapData<T> *>(columns[1]->getData()[i]);
Impl<T>::apply(toBd, bd2);
}
block.getByPosition(result).column = std::move(col_to);
}
};
struct NameBitmapBuild
{
static constexpr auto name = "bitmapBuild";
};
using FunctionBitmapBuild = FunctionBitmapBuildImpl<NameBitmapBuild>;
struct NameBitmapToArray
{
static constexpr auto name = "bitmapToArray";
};
using FunctionBitmapToArray = FunctionBitmapToArrayImpl<NameBitmapToArray>;
struct NameBitmapCardinality
{
static constexpr auto name = "bitmapCardinality";
};
struct NameBitmapAndCardinality
{
static constexpr auto name = "bitmapAndCardinality";
};
struct NameBitmapOrCardinality
{
static constexpr auto name = "bitmapOrCardinality";
};
struct NameBitmapXorCardinality
{
static constexpr auto name = "bitmapXorCardinality";
};
struct NameBitmapAndnotCardinality
{
static constexpr auto name = "bitmapAndnotCardinality";
};
using FunctionBitmapSelfCardinality = FunctionBitmapSelfCardinalityImpl<NameBitmapCardinality>;
using FunctionBitmapAndCardinality = FunctionBitmapCardinality<BitmapAndCardinalityImpl, NameBitmapAndCardinality>;
using FunctionBitmapOrCardinality = FunctionBitmapCardinality<BitmapOrCardinalityImpl, NameBitmapOrCardinality>;
using FunctionBitmapXorCardinality = FunctionBitmapCardinality<BitmapXorCardinalityImpl, NameBitmapXorCardinality>;
using FunctionBitmapAndnotCardinality = FunctionBitmapCardinality<BitmapAndnotCardinalityImpl, NameBitmapAndnotCardinality>;
struct NameBitmapAnd
{
static constexpr auto name = "bitmapAnd";
};
struct NameBitmapOr
{
static constexpr auto name = "bitmapOr";
};
struct NameBitmapXor
{
static constexpr auto name = "bitmapXor";
};
struct NameBitmapAndnot
{
static constexpr auto name = "bitmapAndnot";
};
using FunctionBitmapAnd = FunctionBitmap<BitmapAndImpl, NameBitmapAnd>;
using FunctionBitmapOr = FunctionBitmap<BitmapOrImpl, NameBitmapOr>;
using FunctionBitmapXor = FunctionBitmap<BitmapXorImpl, NameBitmapXor>;
using FunctionBitmapAndnot = FunctionBitmap<BitmapAndnotImpl, NameBitmapAndnot>;
}
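
All of the rb_and/rb_or/rb_xor/rb_andnot calls above delegate to the CRoaring library vendored in contrib/croaring by this commit. A sketch of the underlying set semantics using its C++ wrapper (the bare "roaring.hh" include path is an assumption):

#include <cstdint>
#include <cstdio>
#include "roaring.hh"    /// CRoaring C++ wrapper from contrib/croaring

int main()
{
    Roaring a;
    for (uint32_t v : {1u, 2u, 3u, 5u})
        a.add(v);
    Roaring b;
    for (uint32_t v : {3u, 4u, 5u})
        b.add(v);

    printf("bitmapAndCardinality:    %llu\n", (unsigned long long)(a & b).cardinality());  /// 2
    printf("bitmapOrCardinality:     %llu\n", (unsigned long long)(a | b).cardinality());  /// 5
    printf("bitmapXorCardinality:    %llu\n", (unsigned long long)(a ^ b).cardinality());  /// 3
    printf("bitmapAndnotCardinality: %llu\n", (unsigned long long)(a - b).cardinality());  /// 1
}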

View File

@ -1,5 +1,7 @@
#pragma once
#include <Common/memcmpSmall.h>
#include <Columns/ColumnsNumber.h>
#include <Columns/ColumnConst.h>
#include <Columns/ColumnDecimal.h>
@ -115,30 +117,6 @@ struct NumComparisonImpl
};
inline int memcmp16(const void * a, const void * b)
{
/// Assuming little endian.
UInt64 a_hi = __builtin_bswap64(unalignedLoad<UInt64>(a));
UInt64 b_hi = __builtin_bswap64(unalignedLoad<UInt64>(b));
if (a_hi < b_hi)
return -1;
if (a_hi > b_hi)
return 1;
UInt64 a_lo = __builtin_bswap64(unalignedLoad<UInt64>(reinterpret_cast<const char *>(a) + 8));
UInt64 b_lo = __builtin_bswap64(unalignedLoad<UInt64>(reinterpret_cast<const char *>(b) + 8));
if (a_lo < b_lo)
return -1;
if (a_lo > b_lo)
return 1;
return 0;
}
template <typename Op>
struct StringComparisonImpl
{
@ -148,27 +126,17 @@ struct StringComparisonImpl
PaddedPODArray<UInt8> & c)
{
size_t size = a_offsets.size();
ColumnString::Offset prev_a_offset = 0;
ColumnString::Offset prev_b_offset = 0;
for (size_t i = 0; i < size; ++i)
{
/// Trailing zero byte of the smaller string is included in the comparison.
size_t a_size;
size_t b_size;
int res;
if (i == 0)
{
a_size = a_offsets[0];
b_size = b_offsets[0];
res = memcmp(a_data.data(), b_data.data(), std::min(a_size, b_size));
}
else
{
a_size = a_offsets[i] - a_offsets[i - 1];
b_size = b_offsets[i] - b_offsets[i - 1];
res = memcmp(&a_data[a_offsets[i - 1]], &b_data[b_offsets[i - 1]], std::min(a_size, b_size));
}
c[i] = Op::apply(memcmpSmallAllowOverflow15(
a_data.data() + prev_a_offset, a_offsets[i] - prev_a_offset - 1,
b_data.data() + prev_b_offset, b_offsets[i] - prev_b_offset - 1), 0);
c[i] = Op::apply(res, 0) || (res == 0 && Op::apply(a_size, b_size));
prev_a_offset = a_offsets[i];
prev_b_offset = b_offsets[i];
}
}
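
The rewritten loops above all rely on the ColumnString layout: every string is stored with a terminating zero byte, and offsets[i] points one past that terminator, so the size of string i is offsets[i] - offsets[i - 1] - 1. Tracking prev_offset removes the old i == 0 special case. A toy illustration with plain arrays:

#include <cstdint>
#include <cstdio>

int main()
{
    /// Chars of "ab", "", "xyz", each followed by a terminating zero byte;
    /// offsets[i] is the position one past the terminator of string i.
    const char chars[] = {'a', 'b', '\0', '\0', 'x', 'y', 'z', '\0'};
    const uint64_t offsets[] = {3, 4, 8};

    uint64_t prev_offset = 0;
    for (size_t i = 0; i < 3; ++i)
    {
        uint64_t size = offsets[i] - prev_offset - 1;    /// exclude the terminator
        printf("string %zu: \"%.*s\" (size %llu)\n",
               i, (int)size, chars + prev_offset, (unsigned long long)size);
        prev_offset = offsets[i];
    }
}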
@ -178,43 +146,33 @@ struct StringComparisonImpl
PaddedPODArray<UInt8> & c)
{
size_t size = a_offsets.size();
ColumnString::Offset prev_a_offset = 0;
for (size_t i = 0; i < size; ++i)
{
if (i == 0)
{
int res = memcmp(a_data.data(), b_data.data(), std::min(a_offsets[0] - 1, b_n));
c[i] = Op::apply(res, 0) || (res == 0 && Op::apply(a_offsets[0], b_n + 1));
}
else
{
int res = memcmp(&a_data[a_offsets[i - 1]], &b_data[i * b_n],
std::min(a_offsets[i] - a_offsets[i - 1] - 1, b_n));
c[i] = Op::apply(res, 0) || (res == 0 && Op::apply(a_offsets[i] - a_offsets[i - 1], b_n + 1));
}
c[i] = Op::apply(memcmpSmallAllowOverflow15(
a_data.data() + prev_a_offset, a_offsets[i] - prev_a_offset - 1,
b_data.data() + i * b_n, b_n), 0);
prev_a_offset = a_offsets[i];
}
}
static void NO_INLINE string_vector_constant(
const ColumnString::Chars & a_data, const ColumnString::Offsets & a_offsets,
const std::string & b,
const ColumnString::Chars & b_data, ColumnString::Offset b_size,
PaddedPODArray<UInt8> & c)
{
size_t size = a_offsets.size();
ColumnString::Offset b_size = b.size() + 1;
const UInt8 * b_data = reinterpret_cast<const UInt8 *>(b.data());
ColumnString::Offset prev_a_offset = 0;
for (size_t i = 0; i < size; ++i)
{
/// Trailing zero byte of the smaller string is included in the comparison.
if (i == 0)
{
int res = memcmp(a_data.data(), b_data, std::min(a_offsets[0], b_size));
c[i] = Op::apply(res, 0) || (res == 0 && Op::apply(a_offsets[0], b_size));
}
else
{
int res = memcmp(&a_data[a_offsets[i - 1]], b_data, std::min(a_offsets[i] - a_offsets[i - 1], b_size));
c[i] = Op::apply(res, 0) || (res == 0 && Op::apply(a_offsets[i] - a_offsets[i - 1], b_size));
}
c[i] = Op::apply(memcmpSmallAllowOverflow15(
a_data.data() + prev_a_offset, a_offsets[i] - prev_a_offset - 1,
b_data.data(), b_size), 0);
prev_a_offset = a_offsets[i];
}
}
@ -239,13 +197,13 @@ struct StringComparisonImpl
static void NO_INLINE fixed_string_vector_constant_16(
const ColumnString::Chars & a_data,
const std::string & b,
const ColumnString::Chars & b_data,
PaddedPODArray<UInt8> & c)
{
size_t size = a_data.size();
for (size_t i = 0, j = 0; i < size; i += 16, ++j)
c[j] = Op::apply(memcmp16(&a_data[i], b.data()), 0);
c[j] = Op::apply(memcmp16(&a_data[i], &b_data[0]), 0);
}
static void NO_INLINE fixed_string_vector_fixed_string_vector(
@ -253,74 +211,73 @@ struct StringComparisonImpl
const ColumnString::Chars & b_data, ColumnString::Offset b_n,
PaddedPODArray<UInt8> & c)
{
/** Specialization if both sizes are 16.
* For more efficient comparison of IPv6 addresses stored in FixedString(16).
*/
if (a_n == 16 && b_n == 16)
{
/** Specialization if both sizes are 16.
* For more efficient comparison of IPv6 addresses stored in FixedString(16).
*/
fixed_string_vector_fixed_string_vector_16(a_data, b_data, c);
}
else if (a_n == b_n)
{
size_t size = a_data.size();
for (size_t i = 0, j = 0; i < size; i += a_n, ++j)
c[j] = Op::apply(memcmpSmallAllowOverflow15(a_data.data() + i, b_data.data() + i, a_n), 0);
}
else
{
/// Generic implementation, less efficient.
size_t size = a_data.size();
size_t size = a_data.size() / a_n;
for (size_t i = 0, j = 0; i < size; i += a_n, ++j)
{
int res = memcmp(&a_data[i], &b_data[i], std::min(a_n, b_n));
c[j] = Op::apply(res, 0) || (res == 0 && Op::apply(a_n, b_n));
}
for (size_t i = 0; i < size; ++i)
c[i] = Op::apply(memcmpSmallAllowOverflow15(a_data.data() + i * a_n, a_n, b_data.data() + i * b_n, b_n), 0);
}
}
static void NO_INLINE fixed_string_vector_constant(
const ColumnString::Chars & a_data, ColumnString::Offset a_n,
const std::string & b,
const ColumnString::Chars & b_data, ColumnString::Offset b_size,
PaddedPODArray<UInt8> & c)
{
ColumnString::Offset b_n = b.size();
if (a_n == 16 && b_n == 16)
if (a_n == 16 && b_size == 16)
{
fixed_string_vector_constant_16(a_data, b, c);
fixed_string_vector_constant_16(a_data, b_data, c);
}
else if (a_n == b_size)
{
size_t size = a_data.size();
for (size_t i = 0, j = 0; i < size; i += a_n, ++j)
c[j] = Op::apply(memcmpSmallAllowOverflow15(a_data.data() + i, b_data.data(), a_n), 0);
}
else
{
size_t size = a_data.size();
const UInt8 * b_data = reinterpret_cast<const UInt8 *>(b.data());
for (size_t i = 0, j = 0; i < size; i += a_n, ++j)
{
int res = memcmp(&a_data[i], b_data, std::min(a_n, b_n));
c[j] = Op::apply(res, 0) || (res == 0 && Op::apply(a_n, b_n));
}
c[j] = Op::apply(memcmpSmallAllowOverflow15(a_data.data() + i, a_n, b_data.data(), b_size), 0);
}
}
static void constant_string_vector(
const std::string & a,
const ColumnString::Chars & a_data, ColumnString::Offset a_size,
const ColumnString::Chars & b_data, const ColumnString::Offsets & b_offsets,
PaddedPODArray<UInt8> & c)
{
StringComparisonImpl<typename Op::SymmetricOp>::string_vector_constant(b_data, b_offsets, a, c);
StringComparisonImpl<typename Op::SymmetricOp>::string_vector_constant(b_data, b_offsets, a_data, a_size, c);
}
static void constant_fixed_string_vector(
const std::string & a,
const ColumnString::Chars & a_data, ColumnString::Offset a_size,
const ColumnString::Chars & b_data, ColumnString::Offset b_n,
PaddedPODArray<UInt8> & c)
{
StringComparisonImpl<typename Op::SymmetricOp>::fixed_string_vector_constant(b_data, b_n, a, c);
StringComparisonImpl<typename Op::SymmetricOp>::fixed_string_vector_constant(b_data, b_n, a_data, a_size, c);
}
static void constant_constant(
const std::string & a,
const std::string & b,
const ColumnString::Chars & a_data, ColumnString::Offset a_size,
const ColumnString::Chars & b_data, ColumnString::Offset b_size,
UInt8 & c)
{
size_t a_n = a.size();
size_t b_n = b.size();
int res = memcmp(a.data(), b.data(), std::min(a_n, b_n));
c = Op::apply(res, 0) || (res == 0 && Op::apply(a_n, b_n));
c = Op::apply(memcmpSmallAllowOverflow15(a_data.data(), a_size, b_data.data(), b_size), 0);
}
};
@ -335,11 +292,21 @@ struct StringEqualsImpl
PaddedPODArray<UInt8> & c)
{
size_t size = a_offsets.size();
ColumnString::Offset prev_a_offset = 0;
ColumnString::Offset prev_b_offset = 0;
for (size_t i = 0; i < size; ++i)
c[i] = positive == ((i == 0)
? (a_offsets[0] == b_offsets[0] && !memcmp(a_data.data(), b_data.data(), a_offsets[0] - 1))
: (a_offsets[i] - a_offsets[i - 1] == b_offsets[i] - b_offsets[i - 1]
&& !memcmp(&a_data[a_offsets[i - 1]], &b_data[b_offsets[i - 1]], a_offsets[i] - a_offsets[i - 1] - 1)));
{
auto a_size = a_offsets[i] - prev_a_offset - 1;
auto b_size = b_offsets[i] - prev_b_offset - 1;
c[i] = positive == memequalSmallAllowOverflow15(
a_data.data() + prev_a_offset, a_size,
b_data.data() + prev_b_offset, b_size);
prev_a_offset = a_offsets[i];
prev_b_offset = b_offsets[i];
}
}
static void NO_INLINE string_vector_fixed_string_vector(
@ -348,76 +315,65 @@ struct StringEqualsImpl
PaddedPODArray<UInt8> & c)
{
size_t size = a_offsets.size();
ColumnString::Offset prev_a_offset = 0;
for (size_t i = 0; i < size; ++i)
c[i] = positive == ((i == 0)
? (a_offsets[0] == b_n + 1 && !memcmp(a_data.data(), b_data.data(), b_n))
: (a_offsets[i] - a_offsets[i - 1] == b_n + 1
&& !memcmp(&a_data[a_offsets[i - 1]], &b_data[b_n * i], b_n)));
{
auto a_size = a_offsets[i] - prev_a_offset - 1;
c[i] = positive == memequalSmallAllowOverflow15(
a_data.data() + prev_a_offset, a_size,
b_data.data() + b_n * i, b_n);
prev_a_offset = a_offsets[i];
}
}
static void NO_INLINE string_vector_constant(
const ColumnString::Chars & a_data, const ColumnString::Offsets & a_offsets,
const std::string & b,
const ColumnString::Chars & b_data, ColumnString::Offset b_size,
PaddedPODArray<UInt8> & c)
{
size_t size = a_offsets.size();
ColumnString::Offset b_n = b.size();
const UInt8 * b_data = reinterpret_cast<const UInt8 *>(b.data());
ColumnString::Offset prev_a_offset = 0;
for (size_t i = 0; i < size; ++i)
c[i] = positive == ((i == 0)
? (a_offsets[0] == b_n + 1 && !memcmp(a_data.data(), b_data, b_n))
: (a_offsets[i] - a_offsets[i - 1] == b_n + 1
&& !memcmp(&a_data[a_offsets[i - 1]], b_data, b_n)));
{
auto a_size = a_offsets[i] - prev_a_offset - 1;
c[i] = positive == memequalSmallAllowOverflow15(
a_data.data() + prev_a_offset, a_size,
b_data.data(), b_size);
prev_a_offset = a_offsets[i];
}
}
#ifdef __SSE2__
static void NO_INLINE fixed_string_vector_fixed_string_vector_16(
const ColumnString::Chars & a_data,
const ColumnString::Chars & b_data,
PaddedPODArray<UInt8> & c)
{
size_t size = c.size();
size_t size = a_data.size() / 16;
const __m128i * a_pos = reinterpret_cast<const __m128i *>(a_data.data());
const __m128i * b_pos = reinterpret_cast<const __m128i *>(b_data.data());
UInt8 * c_pos = c.data();
UInt8 * c_end = c_pos + size;
while (c_pos < c_end)
{
*c_pos = positive == (0xFFFF == _mm_movemask_epi8(_mm_cmpeq_epi8(
_mm_loadu_si128(a_pos),
_mm_loadu_si128(b_pos))));
++a_pos;
++b_pos;
++c_pos;
}
for (size_t i = 0; i < size; ++i)
c[i] = positive == memequal16(
a_data.data() + i * 16,
b_data.data() + i * 16);
}
static void NO_INLINE fixed_string_vector_constant_16(
const ColumnString::Chars & a_data,
const std::string & b,
const ColumnString::Chars & b_data,
PaddedPODArray<UInt8> & c)
{
size_t size = c.size();
size_t size = a_data.size() / 16;
const __m128i * a_pos = reinterpret_cast<const __m128i *>(a_data.data());
const __m128i b_value = _mm_loadu_si128(reinterpret_cast<const __m128i *>(b.data()));
UInt8 * c_pos = c.data();
UInt8 * c_end = c_pos + size;
while (c_pos < c_end)
{
*c_pos = positive == (0xFFFF == _mm_movemask_epi8(_mm_cmpeq_epi8(
_mm_loadu_si128(a_pos),
b_value)));
++a_pos;
++c_pos;
}
for (size_t i = 0; i < size; ++i)
c[i] = positive == memequal16(
a_data.data() + i * 16,
b_data.data());
}
#endif
static void NO_INLINE fixed_string_vector_fixed_string_vector(
const ColumnString::Chars & a_data, ColumnString::Offset a_n,
@ -427,38 +383,32 @@ struct StringEqualsImpl
/** Specialization if both sizes are 16.
* For more efficient comparison of IPv6 addresses stored in FixedString(16).
*/
#ifdef __SSE2__
if (a_n == 16 && b_n == 16)
{
fixed_string_vector_fixed_string_vector_16(a_data, b_data, c);
}
else
#endif
{
size_t size = a_data.size();
for (size_t i = 0, j = 0; i < size; i += a_n, ++j)
c[j] = positive == (a_n == b_n && !memcmp(&a_data[i], &b_data[i], a_n));
size_t size = a_data.size() / a_n;
for (size_t i = 0; i < size; ++i)
c[i] = positive == memequalSmallAllowOverflow15(a_data.data() + i * a_n, a_n, b_data.data() + i * b_n, b_n);
}
}
static void NO_INLINE fixed_string_vector_constant(
const ColumnString::Chars & a_data, ColumnString::Offset a_n,
const std::string & b,
const ColumnString::Chars & b_data, ColumnString::Offset b_size,
PaddedPODArray<UInt8> & c)
{
ColumnString::Offset b_n = b.size();
#ifdef __SSE2__
if (a_n == 16 && b_n == 16)
if (a_n == 16 && b_size == 16)
{
fixed_string_vector_constant_16(a_data, b, c);
fixed_string_vector_constant_16(a_data, b_data, c);
}
else
#endif
{
size_t size = a_data.size();
const UInt8 * b_data = reinterpret_cast<const UInt8 *>(b.data());
for (size_t i = 0, j = 0; i < size; i += a_n, ++j)
c[j] = positive == (a_n == b_n && !memcmp(&a_data[i], b_data, a_n));
size_t size = a_data.size() / a_n;
for (size_t i = 0; i < size; ++i)
c[i] = positive == memequalSmallAllowOverflow15(a_data.data() + i * a_n, a_n, b_data.data(), b_size);
}
}
@ -471,27 +421,27 @@ struct StringEqualsImpl
}
static void constant_string_vector(
const std::string & a,
const ColumnString::Chars & a_data, ColumnString::Offset a_size,
const ColumnString::Chars & b_data, const ColumnString::Offsets & b_offsets,
PaddedPODArray<UInt8> & c)
{
string_vector_constant(b_data, b_offsets, a, c);
string_vector_constant(b_data, b_offsets, a_data, a_size, c);
}
static void constant_fixed_string_vector(
const std::string & a,
const ColumnString::Chars & a_data, ColumnString::Offset a_size,
const ColumnString::Chars & b_data, ColumnString::Offset b_n,
PaddedPODArray<UInt8> & c)
{
fixed_string_vector_constant(b_data, b_n, a, c);
fixed_string_vector_constant(b_data, b_n, a_data, a_size, c);
}
static void constant_constant(
const std::string & a,
const std::string & b,
const ColumnString::Chars & a_data, ColumnString::Offset a_size,
const ColumnString::Chars & b_data, ColumnString::Offset b_size,
UInt8 & c)
{
c = positive == (a == b);
c = positive == memequalSmallAllowOverflow15(a_data.data(), a_size, b_data.data(), b_size);
}
};
@ -744,18 +694,62 @@ private:
const ColumnString * c1_string = checkAndGetColumn<ColumnString>(c1);
const ColumnFixedString * c0_fixed_string = checkAndGetColumn<ColumnFixedString>(c0);
const ColumnFixedString * c1_fixed_string = checkAndGetColumn<ColumnFixedString>(c1);
const ColumnConst * c0_const = checkAndGetColumnConstStringOrFixedString(c0);
const ColumnConst * c1_const = checkAndGetColumnConstStringOrFixedString(c1);
if (!((c0_string || c0_fixed_string || c0_const) && (c1_string || c1_fixed_string || c1_const)))
return false;
const ColumnString::Chars * c0_const_chars = nullptr;
const ColumnString::Chars * c1_const_chars = nullptr;
ColumnString::Offset c0_const_size = 0;
ColumnString::Offset c1_const_size = 0;
if (c0_const)
{
const ColumnString * c0_const_string = checkAndGetColumn<ColumnString>(&c0_const->getDataColumn());
const ColumnFixedString * c0_const_fixed_string = checkAndGetColumn<ColumnFixedString>(&c0_const->getDataColumn());
if (c0_const_string)
{
c0_const_chars = &c0_const_string->getChars();
c0_const_size = c0_const_string->getDataAt(0).size;
}
else if (c0_const_fixed_string)
{
c0_const_chars = &c0_const_fixed_string->getChars();
c0_const_size = c0_const_fixed_string->getN();
}
else
throw Exception("Logical error: ColumnConst contains not String nor FixedString column", ErrorCodes::ILLEGAL_COLUMN);
}
if (c1_const)
{
const ColumnString * c1_const_string = checkAndGetColumn<ColumnString>(&c1_const->getDataColumn());
const ColumnFixedString * c1_const_fixed_string = checkAndGetColumn<ColumnFixedString>(&c1_const->getDataColumn());
if (c1_const_string)
{
c1_const_chars = &c1_const_string->getChars();
c1_const_size = c1_const_string->getDataAt(0).size;
}
else if (c1_const_fixed_string)
{
c1_const_chars = &c1_const_fixed_string->getChars();
c1_const_size = c1_const_fixed_string->getN();
}
else
throw Exception("Logical error: ColumnConst contains not String nor FixedString column", ErrorCodes::ILLEGAL_COLUMN);
}
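The two blocks above perform the same String/FixedString extraction for c0 and c1. A hedged refactoring sketch, relying on the surrounding file's includes and types, and using the hypothetical helper name extractConstCharsAndSize:
/// Returns the raw chars and the per-row size of the const column's payload,
/// whether it wraps a ColumnString or a ColumnFixedString.
static std::pair<const ColumnString::Chars *, ColumnString::Offset>
extractConstCharsAndSize(const ColumnConst & column)
{
    if (const auto * str = checkAndGetColumn<ColumnString>(&column.getDataColumn()))
        return {&str->getChars(), str->getDataAt(0).size};
    if (const auto * fixed = checkAndGetColumn<ColumnFixedString>(&column.getDataColumn()))
        return {&fixed->getChars(), fixed->getN()};
    throw Exception("Logical error: ColumnConst contains neither a String nor a FixedString column",
        ErrorCodes::ILLEGAL_COLUMN);
}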
using StringImpl = StringComparisonImpl<Op<int, int>>;
if (c0_const && c1_const)
{
UInt8 res = 0;
StringImpl::constant_constant(c0_const->getValue<String>(), c1_const->getValue<String>(), res);
StringImpl::constant_constant(*c0_const_chars, c0_const_size, *c1_const_chars, c1_const_size, res);
block.getByPosition(result).column = block.getByPosition(result).type->createColumnConst(c0_const->size(), toField(res));
return true;
}
@ -778,7 +772,7 @@ private:
else if (c0_string && c1_const)
StringImpl::string_vector_constant(
c0_string->getChars(), c0_string->getOffsets(),
c1_const->getValue<String>(),
*c1_const_chars, c1_const_size,
c_res->getData());
else if (c0_fixed_string && c1_string)
StringImpl::fixed_string_vector_string_vector(
@ -793,16 +787,16 @@ private:
else if (c0_fixed_string && c1_const)
StringImpl::fixed_string_vector_constant(
c0_fixed_string->getChars(), c0_fixed_string->getN(),
c1_const->getValue<String>(),
*c1_const_chars, c1_const_size,
c_res->getData());
else if (c0_const && c1_string)
StringImpl::constant_string_vector(
c0_const->getValue<String>(),
*c0_const_chars, c0_const_size,
c1_string->getChars(), c1_string->getOffsets(),
c_res->getData());
else if (c0_const && c1_fixed_string)
StringImpl::constant_fixed_string_vector(
c0_const->getValue<String>(),
*c0_const_chars, c0_const_size,
c1_fixed_string->getChars(), c1_fixed_string->getN(),
c_res->getData());
else

View File

@ -6,9 +6,11 @@
#include <DataTypes/DataTypesNumber.h>
#include <Columns/ColumnArray.h>
#include <Columns/ColumnString.h>
#include <Columns/ColumnFixedString.h>
#include <Columns/ColumnsNumber.h>
#include <Columns/ColumnNullable.h>
#include <Common/FieldVisitors.h>
#include <Common/memcmpSmall.h>
namespace DB
@ -272,8 +274,7 @@ struct ArrayIndexNumNullImpl
}
};
/// Implementation for arrays of strings when the 2nd function argument
/// is a NULL value.
/// Implementation for arrays of strings when the 2nd function argument is a NULL value.
template <typename IndexConv>
struct ArrayIndexStringNullImpl
{
@ -311,12 +312,11 @@ struct ArrayIndexStringImpl
{
static void vector_const(
const ColumnString::Chars & data, const ColumnArray::Offsets & offsets, const ColumnString::Offsets & string_offsets,
const String & value,
const ColumnString::Chars & value, ColumnString::Offset value_size,
PaddedPODArray<typename IndexConv::ResultType> & result,
const PaddedPODArray<UInt8> * null_map_data)
{
const auto size = offsets.size();
const auto value_size = value.size();
result.resize(size);
ColumnArray::Offset current_offset = 0;
@ -331,12 +331,12 @@ struct ArrayIndexStringImpl
? 0
: string_offsets[current_offset + j - 1];
ColumnArray::Offset string_size = string_offsets[current_offset + j] - string_pos;
ColumnArray::Offset string_size = string_offsets[current_offset + j] - string_pos - 1;
if (null_map_data && (*null_map_data)[current_offset + j])
{
}
else if (string_size == value_size + 1 && 0 == memcmp(value.data(), &data[string_pos], value_size))
else if (memequalSmallAllowOverflow15(value.data(), value_size, &data[string_pos], string_size))
{
if (!IndexConv::apply(j, current))
break;
@ -381,7 +381,7 @@ struct ArrayIndexStringImpl
if (null_map_item && (*null_map_item)[i])
hit = true;
}
else if (string_size == value_size && 0 == memcmp(&item_values[value_pos], &data[string_pos], value_size))
else if (memequalSmallAllowOverflow15(&item_values[value_pos], value_size, &data[string_pos], string_size))
hit = true;
if (hit)
@ -708,16 +708,32 @@ private:
const auto item_arg = block.getByPosition(arguments[1]).column.get();
if (item_arg->onlyNull())
{
ArrayIndexStringNullImpl<IndexConv>::vector_const(col_nested->getChars(), col_array->getOffsets(),
col_nested->getOffsets(), col_res->getData(), null_map_data);
}
else if (const auto item_arg_const = checkAndGetColumnConstStringOrFixedString(item_arg))
ArrayIndexStringImpl<IndexConv>::vector_const(col_nested->getChars(), col_array->getOffsets(),
col_nested->getOffsets(), item_arg_const->getValue<String>(), col_res->getData(),
null_map_data);
{
const ColumnString * item_const_string = checkAndGetColumn<ColumnString>(&item_arg_const->getDataColumn());
const ColumnFixedString * item_const_fixedstring = checkAndGetColumn<ColumnFixedString>(&item_arg_const->getDataColumn());
if (item_const_string)
ArrayIndexStringImpl<IndexConv>::vector_const(col_nested->getChars(), col_array->getOffsets(), col_nested->getOffsets(),
item_const_string->getChars(), item_const_string->getDataAt(0).size,
col_res->getData(), null_map_data);
else if (item_const_fixedstring)
ArrayIndexStringImpl<IndexConv>::vector_const(col_nested->getChars(), col_array->getOffsets(), col_nested->getOffsets(),
item_const_fixedstring->getChars(), item_const_fixedstring->getN(),
col_res->getData(), null_map_data);
else
throw Exception("Logical error: ColumnConst contains not String nor FixedString column", ErrorCodes::ILLEGAL_COLUMN);
}
else if (const auto item_arg_vector = checkAndGetColumn<ColumnString>(item_arg))
{
ArrayIndexStringImpl<IndexConv>::vector_vector(col_nested->getChars(), col_array->getOffsets(),
col_nested->getOffsets(), item_arg_vector->getChars(), item_arg_vector->getOffsets(),
col_res->getData(), null_map_data, null_map_item);
}
else
return false;

View File

@ -13,6 +13,7 @@ namespace DB
void registerFunctionsArithmetic(FunctionFactory &);
void registerFunctionsArray(FunctionFactory &);
void registerFunctionsTuple(FunctionFactory &);
void registerFunctionsBitmap(FunctionFactory &);
void registerFunctionsCoding(FunctionFactory &);
void registerFunctionsComparison(FunctionFactory &);
void registerFunctionsConditional(FunctionFactory &);
@ -53,6 +54,7 @@ void registerFunctions()
registerFunctionsArithmetic(factory);
registerFunctionsArray(factory);
registerFunctionsTuple(factory);
registerFunctionsBitmap(factory);
registerFunctionsCoding(factory);
registerFunctionsComparison(factory);
registerFunctionsConditional(factory);

View File

@ -192,6 +192,9 @@ void CrossToInnerJoinMatcher::visit(ASTSelectQuery & select, ASTPtr & ast, Data
using CheckExpressionMatcher = OneTypeMatcher<CheckExpressionVisitorData, false>;
using CheckExpressionVisitor = InDepthNodeVisitor<CheckExpressionMatcher, true>;
if (!select.where_expression)
return;
std::vector<DatabaseAndTableWithAlias> table_names;
ASTPtr ast_join = getCrossJoin(select, table_names);
if (!ast_join)
@ -215,10 +218,10 @@ void CrossToInnerJoinMatcher::visit(ASTSelectQuery & select, ASTPtr & ast, Data
select.where_expression.reset();
join.children.push_back(join.on_expression);
ast = ast->clone(); /// rewrite AST in the right manner
data.done = true;
}
ast = ast->clone(); /// rewrite AST in the right manner
data.done = true;
}
}

View File

@ -62,11 +62,11 @@ bool DatabaseAndTableWithAlias::satisfies(const DatabaseAndTableWithAlias & db_t
return database == db_table.database && table == db_table.table;
}
String DatabaseAndTableWithAlias::getQualifiedNamePrefix() const
String DatabaseAndTableWithAlias::getQualifiedNamePrefix(bool with_dot) const
{
if (alias.empty() && table.empty())
return "";
return (!alias.empty() ? alias : table) + '.';
return (!alias.empty() ? alias : table) + (with_dot ? "." : "");
}
std::vector<const ASTTableExpression *> getSelectTablesExpression(const ASTSelectQuery & select_query)

View File

@ -32,7 +32,7 @@ struct DatabaseAndTableWithAlias
DatabaseAndTableWithAlias(const ASTTableExpression & table_expression, const String & current_database = "");
/// "alias." or "table." if alias is empty
String getQualifiedNamePrefix() const;
String getQualifiedNamePrefix(bool with_dot = true) const;
/// Check if it satisfies another db_table name. @note operation is not symmetric.
bool satisfies(const DatabaseAndTableWithAlias & table, bool table_may_be_an_alias);

View File

@ -155,36 +155,57 @@ void ExternalLoader::reloadAndUpdate(bool throw_on_error)
/// periodic update
std::vector<std::pair<std::string, LoadablePtr>> objects_to_update;
auto getNextUpdateTime = [this](const LoadablePtr & current)
{
/// calculate next update time
const auto & lifetime = current->getLifetime();
std::uniform_int_distribution<UInt64> distribution{lifetime.min_sec, lifetime.max_sec};
return std::chrono::system_clock::now() + std::chrono::seconds{distribution(rnd_engine)};
};
/// Collect objects that need to be updated under lock. Then create new versions without lock, and assign under lock.
{
std::lock_guard lock{map_mutex};
for (auto & loadable_object : loadable_objects)
{
/// If the loadable objects failed to load or even failed to initialize from the config.
if (!loadable_object.second.loadable)
continue;
try
{
/// If the loadable objects failed to load or even failed to initialize from the config.
if (!loadable_object.second.loadable)
continue;
const LoadablePtr & current = loadable_object.second.loadable;
const auto & lifetime = current->getLifetime();
const LoadablePtr & current = loadable_object.second.loadable;
const auto & lifetime = current->getLifetime();
/// do not update loadable objects with zero as lifetime
if (lifetime.min_sec == 0 || lifetime.max_sec == 0)
continue;
/// do not update loadable objects with zero as lifetime
if (lifetime.min_sec == 0 || lifetime.max_sec == 0)
continue;
if (!current->supportUpdates())
continue;
if (!current->supportUpdates())
continue;
auto update_time = update_times[current->getName()];
auto & update_time = update_times[current->getName()];
/// check that timeout has passed
if (std::chrono::system_clock::now() < update_time)
continue;
/// check that timeout has passed
if (std::chrono::system_clock::now() < update_time)
continue;
if (!current->isModified())
continue;
if (!current->isModified())
{
update_time = getNextUpdateTime(current);
continue;
}
objects_to_update.emplace_back(loadable_object.first, current);
objects_to_update.emplace_back(loadable_object.first, current);
}
catch (...)
{
tryLogCurrentException(log, "Cannot check if the '" + loadable_object.first + "' " + object_name + " needs to be updated");
if (throw_on_error)
throw;
}
}
}
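The comment above describes a three-step locking discipline; a minimal generic sketch of that pattern follows (all names here are illustrative, not the actual ExternalLoader members):
#include <mutex>
#include <vector>
/// 1. Snapshot the work list under the mutex, 2. do the expensive reload
/// outside it, 3. re-acquire the mutex only to publish the results.
template <typename Object, typename Reload, typename Publish>
void updateOutsideLock(std::mutex & m, const std::vector<Object> & registry,
                       Reload reload, Publish publish)
{
    std::vector<Object> to_update;
    {
        std::lock_guard lock{m};
        to_update = registry;
    }
    for (auto & obj : to_update)
        reload(obj);
    {
        std::lock_guard lock{m};
        for (auto & obj : to_update)
            publish(obj);
    }
}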
@ -209,10 +230,7 @@ void ExternalLoader::reloadAndUpdate(bool throw_on_error)
if (auto it = loadable_objects.find(name); it != loadable_objects.end())
{
/// calculate next update time
const auto & lifetime = current->getLifetime();
std::uniform_int_distribution<UInt64> distribution{lifetime.min_sec, lifetime.max_sec};
update_times[name] = std::chrono::system_clock::now() + std::chrono::seconds{distribution(rnd_engine)};
update_times[name] = getNextUpdateTime(current);
it->second.exception = exception;
if (!exception)

View File

@ -16,13 +16,13 @@ void FindIdentifierBestTableData::visit(ASTIdentifier & identifier, ASTPtr &)
if (!identifier.compound())
{
for (const auto & [table, names] : tables)
for (const auto & table_names : tables)
{
if (std::find(names.begin(), names.end(), identifier.name) != names.end())
if (std::find(table_names.second.begin(), table_names.second.end(), identifier.name) != table_names.second.end())
{
// TODO: make sure no collision ever happens
if (!best_table)
best_table = &table;
best_table = &table_names.first;
}
}
}
@ -30,13 +30,13 @@ void FindIdentifierBestTableData::visit(ASTIdentifier & identifier, ASTPtr &)
{
// FIXME: make a better matcher using `names`?
size_t best_match = 0;
for (const auto & [table, names] : tables)
for (const auto & table_names : tables)
{
if (size_t match = IdentifierSemantic::canReferColumnToTable(identifier, table))
if (size_t match = IdentifierSemantic::canReferColumnToTable(identifier, table_names.first))
if (match > best_match)
{
best_match = match;
best_table = &table;
best_table = &table_names.first;
}
}
}

View File

@ -37,7 +37,7 @@ public:
virtual std::string getName() const = 0;
/// True if object can be updated when lifetime exceeded.
virtual bool supportUpdates() const = 0;
/// If lifetime exceeded and isModified() ExternalLoader replace current object with the result of clone().
/// If lifetime exceeded and isModified(), ExternalLoader replaces the current object with the result of clone().
virtual bool isModified() const = 0;
/// Returns new object with the same configuration. Is used to update modified object when lifetime exceeded.
virtual std::unique_ptr<IExternalLoadable> clone() const = 0;

View File

@ -36,9 +36,10 @@ struct ColumnAliasesMatcher
{
const std::vector<DatabaseAndTableWithAlias> tables;
bool public_names;
AsteriskSemantic::RevertedAliases rev_aliases;
std::unordered_map<String, String> aliases;
AsteriskSemantic::RevertedAliases rev_aliases; /// long_name -> aliases
std::unordered_map<String, String> aliases; /// alias -> long_name
std::vector<std::pair<ASTIdentifier *, bool>> compound_identifiers;
std::set<String> allowed_long_names; /// original names allowed as aliases '--t.x as t.x' (select expressions only).
Data(std::vector<DatabaseAndTableWithAlias> && tables_)
: tables(tables_)
@ -51,29 +52,37 @@ struct ColumnAliasesMatcher
for (auto & [identifier, is_public] : compound_identifiers)
{
auto it = rev_aliases.find(identifier->name);
String long_name = identifier->name;
auto it = rev_aliases.find(long_name);
if (it == rev_aliases.end())
{
bool last_table = IdentifierSemantic::canReferColumnToTable(*identifier, tables.back());
if (!last_table)
{
String long_name = identifier->name;
String alias = hide_prefix + long_name;
aliases[alias] = long_name;
rev_aliases[long_name].push_back(alias);
identifier->setShortName(alias);
if (is_public)
{
identifier->setAlias(long_name);
allowed_long_names.insert(long_name);
}
}
else if (is_public)
identifier->setAlias(identifier->name); /// prevent crop long to short name
identifier->setAlias(long_name); /// prevent crop long to short name
}
else
{
if (it->second.empty())
throw Exception("No alias for '" + identifier->name + "'", ErrorCodes::LOGICAL_ERROR);
identifier->setShortName(it->second[0]);
throw Exception("No alias for '" + long_name + "'", ErrorCodes::LOGICAL_ERROR);
if (is_public && allowed_long_names.count(long_name))
; /// leave original name unchanged for correct output
else
identifier->setShortName(it->second[0]);
}
}
}
@ -131,7 +140,7 @@ struct ColumnAliasesMatcher
node.setAlias("");
}
}
else
else if (node.compound())
data.compound_identifiers.emplace_back(&node, data.public_names);
}
};

View File

@ -75,7 +75,7 @@ struct Settings
M(SettingFloat, totals_auto_threshold, 0.5, "The threshold for totals_mode = 'auto'.") \
\
M(SettingBool, compile, false, "Whether query compilation is enabled.") \
M(SettingBool, compile_expressions, true, "Compile some scalar functions and operators to native code.") \
M(SettingBool, compile_expressions, false, "Compile some scalar functions and operators to native code.") \
M(SettingUInt64, min_count_to_compile, 3, "The number of structurally identical queries before they are compiled.") \
M(SettingUInt64, min_count_to_compile_expression, 3, "The number of identical expressions before they are JIT-compiled") \
M(SettingUInt64, group_by_two_level_threshold, 100000, "From what number of keys, a two-level aggregation starts. 0 - the threshold is not set.") \

View File

@ -652,7 +652,8 @@ SyntaxAnalyzerResultPtr SyntaxAnalyzer::analyze(
{
if (const ASTTablesInSelectQueryElement * node = select_query->join())
{
replaceJoinedTable(node);
if (settings.enable_optimize_predicate_expression)
replaceJoinedTable(node);
const auto & joined_expression = static_cast<const ASTTableExpression &>(*node->table_expression);
DatabaseAndTableWithAlias table(joined_expression, context.getCurrentDatabase());

View File

@ -143,21 +143,14 @@ void TranslateQualifiedNamesMatcher::visit(ASTSelectQuery & select, const ASTPtr
Visitor(data).visit(*add_node);
}
/// qualified names for duplicates
static std::shared_ptr<ASTIdentifier> makeIdentifier(const String & short_name, const String & long_name, bool need_long_name)
static void addIdentifier(ASTs & nodes, const String & table_name, const String & column_name, AsteriskSemantic::RevertedAliasesPtr aliases)
{
if (need_long_name)
return std::make_shared<ASTIdentifier>(long_name);
return std::make_shared<ASTIdentifier>(short_name);
}
auto identifier = std::make_shared<ASTIdentifier>(std::vector<String>{table_name, column_name});
static void addIdentifier(ASTs & nodes, std::shared_ptr<ASTIdentifier> identifier, const String & long_name,
AsteriskSemantic::RevertedAliasesPtr aliases)
{
bool added = false;
if (aliases && aliases->count(long_name))
if (aliases && aliases->count(identifier->name))
{
for (const String & alias : (*aliases)[long_name])
for (const String & alias : (*aliases)[identifier->name])
{
nodes.push_back(identifier->clone());
nodes.back()->setAlias(alias);
@ -173,7 +166,6 @@ static void addIdentifier(ASTs & nodes, std::shared_ptr<ASTIdentifier> identifie
void TranslateQualifiedNamesMatcher::visit(ASTExpressionList & node, const ASTPtr &, Data & data)
{
const auto & tables_with_columns = data.tables;
const auto & source_columns = data.source_columns;
ASTs old_children;
if (data.processAsterisks())
@ -208,16 +200,14 @@ void TranslateQualifiedNamesMatcher::visit(ASTExpressionList & node, const ASTPt
if (const auto * asterisk = typeid_cast<const ASTAsterisk *>(child.get()))
{
bool first_table = true;
for (const auto & [table_name, table_columns] : tables_with_columns)
for (const auto & [table, table_columns] : tables_with_columns)
{
for (const auto & column_name : table_columns)
{
if (first_table || !data.join_using_columns.count(column_name))
{
bool need_prefix = !first_table && source_columns.count(column_name);
String long_name = table_name.getQualifiedNamePrefix() + column_name;
auto identifier = makeIdentifier(column_name, long_name, need_prefix);
addIdentifier(node.children, identifier, long_name, AsteriskSemantic::getAliases(*asterisk));
String table_name = table.getQualifiedNamePrefix(false);
addIdentifier(node.children, table_name, column_name, AsteriskSemantic::getAliases(*asterisk));
}
}
@ -228,22 +218,17 @@ void TranslateQualifiedNamesMatcher::visit(ASTExpressionList & node, const ASTPt
{
DatabaseAndTableWithAlias ident_db_and_name(qualified_asterisk->children[0]);
bool first_table = true;
for (const auto & [table_name, table_columns] : tables_with_columns)
for (const auto & [table, table_columns] : tables_with_columns)
{
if (ident_db_and_name.satisfies(table_name, true))
if (ident_db_and_name.satisfies(table, true))
{
for (const auto & column_name : table_columns)
{
bool need_prefix = !first_table && source_columns.count(column_name);
String long_name = table_name.getQualifiedNamePrefix() + column_name;
auto identifier = makeIdentifier(column_name, long_name, need_prefix);
addIdentifier(node.children, identifier, long_name, AsteriskSemantic::getAliases(*qualified_asterisk));
String table_name = table.getQualifiedNamePrefix(false);
addIdentifier(node.children, table_name, column_name, AsteriskSemantic::getAliases(*qualified_asterisk));
}
break;
}
first_table = false;
}
}
else

View File

@ -63,18 +63,24 @@ static String joinLines(const String & query)
/// Log query into text log (not into system table).
static void logQuery(const String & query, const Context & context)
static void logQuery(const String & query, const Context & context, bool internal)
{
const auto & current_query_id = context.getClientInfo().current_query_id;
const auto & initial_query_id = context.getClientInfo().initial_query_id;
const auto & current_user = context.getClientInfo().current_user;
if (internal)
{
LOG_DEBUG(&Logger::get("executeQuery"), "(internal) " << joinLines(query));
}
else
{
const auto & current_query_id = context.getClientInfo().current_query_id;
const auto & initial_query_id = context.getClientInfo().initial_query_id;
const auto & current_user = context.getClientInfo().current_user;
LOG_DEBUG(&Logger::get("executeQuery"), "(from " << context.getClientInfo().current_address.toString()
<< (current_user != "default" ? ", user: " + context.getClientInfo().current_user : "")
<< (!initial_query_id.empty() && current_query_id != initial_query_id ? ", initial_query_id: " + initial_query_id : std::string())
<< ") "
<< joinLines(query)
);
LOG_DEBUG(&Logger::get("executeQuery"), "(from " << context.getClientInfo().current_address.toString()
<< (current_user != "default" ? ", user: " + context.getClientInfo().current_user : "")
<< (!initial_query_id.empty() && current_query_id != initial_query_id ? ", initial_query_id: " + initial_query_id : std::string())
<< ") "
<< joinLines(query));
}
}
@ -176,13 +182,12 @@ static std::tuple<ASTPtr, BlockIO> executeQueryImpl(
}
catch (...)
{
/// Anyway log the query.
String query = String(begin, begin + std::min(end - begin, static_cast<ptrdiff_t>(max_query_size)));
logQuery(query.substr(0, settings.log_queries_cut_to_length), context, internal);
if (!internal)
{
/// Anyway log the query.
String query = String(begin, begin + std::min(end - begin, static_cast<ptrdiff_t>(max_query_size)));
logQuery(query.substr(0, settings.log_queries_cut_to_length), context);
onExceptionBeforeStart(query, context, current_time);
}
throw;
}
@ -193,15 +198,14 @@ static std::tuple<ASTPtr, BlockIO> executeQueryImpl(
try
{
if (!internal)
logQuery(query.substr(0, settings.log_queries_cut_to_length), context);
logQuery(query.substr(0, settings.log_queries_cut_to_length), context, internal);
if (!internal && settings.allow_experimental_multiple_joins_emulation)
{
JoinToSubqueryTransformVisitor::Data join_to_subs_data;
JoinToSubqueryTransformVisitor(join_to_subs_data).visit(ast);
if (join_to_subs_data.done)
logQuery(queryToString(*ast), context);
logQuery(queryToString(*ast), context, internal);
}
if (!internal && settings.allow_experimental_cross_to_join_conversion)
@ -209,7 +213,7 @@ static std::tuple<ASTPtr, BlockIO> executeQueryImpl(
CrossToInnerJoinVisitor::Data cross_to_inner;
CrossToInnerJoinVisitor(cross_to_inner).visit(ast);
if (cross_to_inner.done)
logQuery(queryToString(*ast), context);
logQuery(queryToString(*ast), context, internal);
}
/// Check the limits.

View File

@ -29,6 +29,10 @@ ASTIdentifier::ASTIdentifier(const String & name_, std::vector<String> && name_p
{
}
ASTIdentifier::ASTIdentifier(std::vector<String> && name_parts_)
: ASTIdentifier(name_parts_.at(0) + '.' + name_parts_.at(1), std::move(name_parts_))
{}
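A hedged usage note for the constructor added above: it expects exactly two name parts and joins them with a dot, so name_parts_.at(1) throws for shorter vectors. For example (illustrative only):
/// Builds the compound identifier "t1.a" with name_parts == {"t1", "a"};
/// this is how TranslateQualifiedNamesMatcher constructs qualified columns.
auto ident = std::make_shared<ASTIdentifier>(std::vector<String>{"t1", "a"});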
void ASTIdentifier::setShortName(const String & new_name)
{
name = new_name;
@ -48,9 +52,8 @@ void ASTIdentifier::formatImplWithoutAlias(const FormatSettings & settings, Form
settings.ostr << (settings.hilite ? hilite_none : "");
};
/// A simple or compound identifier?
if (name_parts.size() > 1)
/// It could be compound but short
if (!isShort())
{
for (size_t i = 0, size = name_parts.size(); i < size; ++i)
{

View File

@ -22,6 +22,7 @@ public:
String name;
ASTIdentifier(const String & name_, std::vector<String> && name_parts_ = {});
ASTIdentifier(std::vector<String> && name_parts_);
/** Get the text that identifies this element. */
String getID(char delim) const override { return "Identifier" + (delim + name); }

View File

@ -126,17 +126,32 @@ static void appendGraphitePattern(
throw Exception("Unknown element in config: " + key, ErrorCodes::UNKNOWN_ELEMENT_IN_CONFIG);
}
if (!pattern.function)
throw Exception("Aggregate function is mandatory for retention patterns in GraphiteMergeTree",
if (!pattern.function && pattern.retentions.empty())
throw Exception("At least one of an aggregate function or retention rules is mandatory for rollup patterns in GraphiteMergeTree",
ErrorCodes::NO_ELEMENTS_IN_CONFIG);
if (pattern.function->allocatesMemoryInArena())
throw Exception("Aggregate function " + pattern.function->getName() + " isn't supported in GraphiteMergeTree",
ErrorCodes::NOT_IMPLEMENTED);
if (!pattern.function)
{
pattern.type = pattern.TypeRetention;
}
else if (pattern.retentions.empty())
{
pattern.type = pattern.TypeAggregation;
}
else
{
pattern.type = pattern.TypeAll;
}
if (pattern.type & pattern.TypeAggregation) /// TypeAggregation or TypeAll
if (pattern.function->allocatesMemoryInArena())
throw Exception("Aggregate function " + pattern.function->getName() + " isn't supported in GraphiteMergeTree",
ErrorCodes::NOT_IMPLEMENTED);
/// Retentions should be in descending order of age.
std::sort(pattern.retentions.begin(), pattern.retentions.end(),
[] (const Graphite::Retention & a, const Graphite::Retention & b) { return a.age > b.age; });
if (pattern.type & pattern.TypeRetention) /// TypeRetention or TypeAll
std::sort(pattern.retentions.begin(), pattern.retentions.end(),
[] (const Graphite::Retention & a, const Graphite::Retention & b) { return a.age > b.age; });
patterns.emplace_back(pattern);
}
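A hedged sketch of the flag layout implied by the bitwise checks above; the concrete numeric values are assumptions, not taken from this diff:
/// TypeAll must combine both bits so that `type & TypeRetention` and
/// `type & TypeAggregation` each match it, exactly as the comments require.
enum RollupPatternType : UInt8
{
    TypeRetention   = 0x1,  /// only <retention> rules, no aggregate function
    TypeAggregation = 0x2,  /// only an aggregate <function>, no retentions
    TypeAll         = TypeRetention | TypeAggregation,
};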

View File

@ -148,13 +148,26 @@ void StorageSystemGraphite::fillData(MutableColumns & res_columns, const Context
const auto patterns = readPatterns(config, section);
for (const auto & pattern : patterns)
{
for (const auto & ret : pattern.retentions)
if (!pattern.retentions.empty())
{
for (const auto & ret : pattern.retentions)
{
res_columns[0]->insert(section);
res_columns[1]->insert(pattern.regexp);
res_columns[2]->insert(pattern.function);
res_columns[3]->insert(ret.age);
res_columns[4]->insert(ret.precision);
res_columns[5]->insert(pattern.priority);
res_columns[6]->insert(pattern.is_default);
}
}
else
{
res_columns[0]->insert(section);
res_columns[1]->insert(pattern.regexp);
res_columns[2]->insert(pattern.function);
res_columns[3]->insert(ret.age);
res_columns[4]->insert(ret.precision);
res_columns[3]->insert(0);
res_columns[4]->insert(0);
res_columns[5]->insert(pattern.priority);
res_columns[6]->insert(pattern.is_default);
}

View File

@ -5,6 +5,29 @@
<time_column_name>timestamp</time_column_name>
<value_column_name>value</value_column_name>
<version_column_name>updated</version_column_name>
<pattern>
<regexp>\.count$</regexp>
<function>sum</function>
</pattern>
<pattern>
<regexp>\.max$</regexp>
<function>max</function>
</pattern>
<pattern>
<regexp>^five_min\.</regexp>
<retention>
<age>0</age>
<precision>300</precision>
</retention>
<retention>
<age>5184000</age>
<precision>3600</precision>
</retention>
<retention>
<age>31536000</age>
<precision>14400</precision>
</retention>
</pattern>
<pattern>
<regexp>^one_min</regexp>
<function>avg</function>
@ -22,4 +45,53 @@
</retention>
</pattern>
</graphite_rollup>
<graphite_rollup_with_default>
<path_column_name>metric</path_column_name>
<time_column_name>timestamp</time_column_name>
<value_column_name>value</value_column_name>
<version_column_name>updated</version_column_name>
<pattern>
<regexp>\.count$</regexp>
<function>sum</function>
</pattern>
<pattern>
<regexp>\.max$</regexp>
<function>max</function>
</pattern>
<default>
<function>any</function>
<retention>
<age>0</age>
<precision>60</precision>
</retention>
<retention>
<age>7776000</age>
<precision>300</precision>
</retention>
<retention>
<age>31536000</age>
<precision>600</precision>
</retention>
</default>
</graphite_rollup_with_default>
<graphite_rollup_broken>
<path_column_name>metric</path_column_name>
<time_column_name>timestamp</time_column_name>
<value_column_name>value</value_column_name>
<version_column_name>updated</version_column_name>
<default>
<retention>
<age>0</age>
<precision>60</precision>
</retention>
<retention>
<age>7776000</age>
<precision>300</precision>
</retention>
<retention>
<age>31536000</age>
<precision>600</precision>
</retention>
</default>
</graphite_rollup_broken>
</yandex>

View File

@ -8,31 +8,38 @@ from helpers.test_tools import TSV
cluster = ClickHouseCluster(__file__)
instance = cluster.add_instance('instance', main_configs=['configs/graphite_rollup.xml'])
instance = cluster.add_instance('instance',
main_configs=['configs/graphite_rollup.xml'])
q = instance.query
@pytest.fixture(scope="module")
def started_cluster():
try:
cluster.start()
instance.query('CREATE DATABASE test')
q('CREATE DATABASE test')
yield cluster
finally:
cluster.shutdown()
@pytest.fixture
def graphite_table(started_cluster):
instance.query('''
q('''
DROP TABLE IF EXISTS test.graphite;
CREATE TABLE test.graphite
(metric String, value Float64, timestamp UInt32, date Date, updated UInt32)
ENGINE = GraphiteMergeTree(date, (metric, timestamp), 8192, 'graphite_rollup');
ENGINE = GraphiteMergeTree('graphite_rollup')
PARTITION BY toYYYYMM(date)
ORDER BY (metric, timestamp)
SETTINGS index_granularity=8192;
''')
yield
instance.query('DROP TABLE test.graphite')
q('DROP TABLE test.graphite')
def test_rollup_versions(graphite_table):
@ -40,13 +47,14 @@ def test_rollup_versions(graphite_table):
rounded_timestamp = timestamp - timestamp % 60
date = datetime.date.today().isoformat()
q = instance.query
# Insert rows with timestamps relative to the current time so that the first retention clause is active.
# Insert rows with timestamps relative to the current time so that the
# first retention clause is active.
# Two parts are created.
q('''
INSERT INTO test.graphite (metric, value, timestamp, date, updated) VALUES ('one_min.x1', 100, {timestamp}, '{date}', 1);
INSERT INTO test.graphite (metric, value, timestamp, date, updated) VALUES ('one_min.x1', 200, {timestamp}, '{date}', 2);
INSERT INTO test.graphite (metric, value, timestamp, date, updated)
VALUES ('one_min.x1', 100, {timestamp}, '{date}', 1);
INSERT INTO test.graphite (metric, value, timestamp, date, updated)
VALUES ('one_min.x1', 200, {timestamp}, '{date}', 2);
'''.format(timestamp=timestamp, date=date))
expected1 = '''\
@ -54,7 +62,9 @@ one_min.x1 100 {timestamp} {date} 1
one_min.x1 200 {timestamp} {date} 2
'''.format(timestamp=timestamp, date=date)
assert TSV(q('SELECT * FROM test.graphite ORDER BY updated')) == TSV(expected1)
assert TSV(
q('SELECT * FROM test.graphite ORDER BY updated')
) == TSV(expected1)
q('OPTIMIZE TABLE test.graphite')
@ -67,8 +77,6 @@ one_min.x1 200 {timestamp} {date} 2
def test_rollup_aggregation(graphite_table):
q = instance.query
# This query essentially emulates what rollup does.
result1 = q('''
SELECT avg(v), max(upd)
@ -91,7 +99,8 @@ FROM (SELECT timestamp,
'''
assert TSV(result1) == TSV(expected1)
# Timestamp 1111111111 is in sufficiently distant past so that the last retention clause is active.
# Timestamp 1111111111 is in sufficiently distant past
# so that the last retention clause is active.
result2 = q('''
INSERT INTO test.graphite
SELECT 'one_min.x' AS metric,
@ -114,7 +123,7 @@ one_min.x 999634.9918367347 1111444200 2017-02-02 499999
def test_rollup_aggregation_2(graphite_table):
result = instance.query('''
result = q('''
INSERT INTO test.graphite
SELECT 'one_min.x' AS metric,
toFloat64(number) AS value,
@ -136,7 +145,7 @@ one_min.x 24 1111110600 2017-02-02 100
def test_multiple_paths_and_versions(graphite_table):
result = instance.query('''
result = q('''
INSERT INTO test.graphite
SELECT 'one_min.x' AS metric,
toFloat64(number) AS value,
@ -163,7 +172,9 @@ OPTIMIZE TABLE test.graphite PARTITION 201702 FINAL;
SELECT * FROM test.graphite;
''')
with open(p.join(p.dirname(__file__), 'test_multiple_paths_and_versions.reference')) as reference:
with open(p.join(p.dirname(__file__),
'test_multiple_paths_and_versions.reference')
) as reference:
assert TSV(result) == TSV(reference)
@ -177,14 +188,18 @@ def test_multiple_output_blocks(graphite_table):
for j in range(3):
cur_time = rolled_up_time + 100 * j
to_insert += 'one_min.x1 {} {} 2001-09-09 1\n'.format(10 * j, cur_time)
to_insert += 'one_min.x1 {} {} 2001-09-09 2\n'.format(10 * (j + 1), cur_time)
to_insert += 'one_min.x1 {} {} 2001-09-09 1\n'.format(
10 * j, cur_time
)
to_insert += 'one_min.x1 {} {} 2001-09-09 2\n'.format(
10 * (j + 1), cur_time
)
expected += 'one_min.x1 20 {} 2001-09-09 2\n'.format(rolled_up_time)
instance.query('INSERT INTO test.graphite FORMAT TSV', to_insert)
q('INSERT INTO test.graphite FORMAT TSV', to_insert)
result = instance.query('''
result = q('''
OPTIMIZE TABLE test.graphite PARTITION 200109 FINAL;
SELECT * FROM test.graphite;
@ -200,14 +215,14 @@ zzzzzzzz 100 1000000001 2001-09-09 1
zzzzzzzz 200 1000000001 2001-09-09 2
'''
instance.query('INSERT INTO test.graphite FORMAT TSV', to_insert)
q('INSERT INTO test.graphite FORMAT TSV', to_insert)
expected = '''\
one_min.x1 100 999999600 2001-09-09 1
zzzzzzzz 200 1000000001 2001-09-09 2
'''
result = instance.query('''
result = q('''
OPTIMIZE TABLE test.graphite PARTITION 200109 FINAL;
SELECT * FROM test.graphite;
@ -215,27 +230,171 @@ SELECT * FROM test.graphite;
assert TSV(result) == TSV(expected)
def test_path_dangling_pointer(graphite_table):
instance.query('''
q('''
DROP TABLE IF EXISTS test.graphite2;
CREATE TABLE test.graphite2
(metric String, value Float64, timestamp UInt32, date Date, updated UInt32)
ENGINE = GraphiteMergeTree(date, (metric, timestamp), 1, 'graphite_rollup');
''')
(metric String, value Float64, timestamp UInt32, date Date, updated UInt32)
ENGINE = GraphiteMergeTree('graphite_rollup')
PARTITION BY toYYYYMM(date)
ORDER BY (metric, timestamp)
SETTINGS index_granularity=1;
''')
path = 'abcd' * 4000000 # 16MB
instance.query('INSERT INTO test.graphite2 FORMAT TSV', "{}\t0.0\t0\t2018-01-01\t100\n".format(path))
instance.query('INSERT INTO test.graphite2 FORMAT TSV', "{}\t0.0\t0\t2018-01-01\t101\n".format(path))
path = 'abcd' * 4000000 # 16MB
q('INSERT INTO test.graphite2 FORMAT TSV',
"{}\t0.0\t0\t2018-01-01\t100\n".format(path))
q('INSERT INTO test.graphite2 FORMAT TSV',
"{}\t0.0\t0\t2018-01-01\t101\n".format(path))
for version in range(10):
instance.query('INSERT INTO test.graphite2 FORMAT TSV', "{}\t0.0\t0\t2018-01-01\t{}\n".format(path, version))
q('INSERT INTO test.graphite2 FORMAT TSV',
"{}\t0.0\t0\t2018-01-01\t{}\n".format(path, version))
while True:
instance.query('OPTIMIZE TABLE test.graphite2 PARTITION 201801 FINAL')
parts = int(instance.query("SELECT count() FROM system.parts WHERE active AND database='test' AND table='graphite2'"))
if parts == 1:
break
print "Parts", parts
q('OPTIMIZE TABLE test.graphite2 PARTITION 201801 FINAL')
parts = int(q("SELECT count() FROM system.parts "
"WHERE active AND database='test' "
"AND table='graphite2'"))
if parts == 1:
break
print('Parts', parts)
assert TSV(instance.query("SELECT value, timestamp, date, updated FROM test.graphite2")) == TSV("0\t0\t2018-01-01\t101\n")
assert TSV(
q("SELECT value, timestamp, date, updated FROM test.graphite2")
) == TSV("0\t0\t2018-01-01\t101\n")
instance.query('DROP TABLE test.graphite2')
q('DROP TABLE test.graphite2')
def test_combined_rules(graphite_table):
# 1487970000 ~ Sat 25 Feb 00:00:00 MSK 2017
to_insert = 'INSERT INTO test.graphite VALUES '
expected_unmerged = ''
for i in range(384):
to_insert += "('five_min.count', {v}, {t}, toDate({t}), 1), ".format(
v=1, t=1487970000+(i*300)
)
to_insert += "('five_min.max', {v}, {t}, toDate({t}), 1), ".format(
v=i, t=1487970000+(i*300)
)
expected_unmerged += ("five_min.count\t{v1}\t{t}\n"
"five_min.max\t{v2}\t{t}\n").format(
v1=1, v2=i,
t=1487970000+(i*300)
)
q(to_insert)
assert TSV(q('SELECT metric, value, timestamp FROM test.graphite'
' ORDER BY (timestamp, metric)')) == TSV(expected_unmerged)
q('OPTIMIZE TABLE test.graphite PARTITION 201702 FINAL')
expected_merged = '''
five_min.count 48 1487970000 2017-02-25 1
five_min.count 48 1487984400 2017-02-25 1
five_min.count 48 1487998800 2017-02-25 1
five_min.count 48 1488013200 2017-02-25 1
five_min.count 48 1488027600 2017-02-25 1
five_min.count 48 1488042000 2017-02-25 1
five_min.count 48 1488056400 2017-02-26 1
five_min.count 48 1488070800 2017-02-26 1
five_min.max 47 1487970000 2017-02-25 1
five_min.max 95 1487984400 2017-02-25 1
five_min.max 143 1487998800 2017-02-25 1
five_min.max 191 1488013200 2017-02-25 1
five_min.max 239 1488027600 2017-02-25 1
five_min.max 287 1488042000 2017-02-25 1
five_min.max 335 1488056400 2017-02-26 1
five_min.max 383 1488070800 2017-02-26 1
'''
assert TSV(q('SELECT * FROM test.graphite'
' ORDER BY (metric, timestamp)')) == TSV(expected_merged)
def test_combined_rules_with_default(graphite_table):
q('''
DROP TABLE IF EXISTS test.graphite;
CREATE TABLE test.graphite
(metric String, value Float64, timestamp UInt32, date Date, updated UInt32)
ENGINE = GraphiteMergeTree('graphite_rollup_with_default')
PARTITION BY toYYYYMM(date)
ORDER BY (metric, timestamp)
SETTINGS index_granularity=1;
''')
# 1487970000 ~ Sat 25 Feb 00:00:00 MSK 2017
to_insert = 'INSERT INTO test.graphite VALUES '
expected_unmerged = ''
for i in range(100):
to_insert += "('top_level.count', {v}, {t}, toDate({t}), 1), ".format(
v=1, t=1487970000+(i*60)
)
to_insert += "('top_level.max', {v}, {t}, toDate({t}), 1), ".format(
v=i, t=1487970000+(i*60)
)
expected_unmerged += ("top_level.count\t{v1}\t{t}\n"
"top_level.max\t{v2}\t{t}\n").format(
v1=1, v2=i,
t=1487970000+(i*60)
)
q(to_insert)
assert TSV(q('SELECT metric, value, timestamp FROM test.graphite'
' ORDER BY (timestamp, metric)')) == TSV(expected_unmerged)
q('OPTIMIZE TABLE test.graphite PARTITION 201702 FINAL')
expected_merged = '''
top_level.count 10 1487970000 2017-02-25 1
top_level.count 10 1487970600 2017-02-25 1
top_level.count 10 1487971200 2017-02-25 1
top_level.count 10 1487971800 2017-02-25 1
top_level.count 10 1487972400 2017-02-25 1
top_level.count 10 1487973000 2017-02-25 1
top_level.count 10 1487973600 2017-02-25 1
top_level.count 10 1487974200 2017-02-25 1
top_level.count 10 1487974800 2017-02-25 1
top_level.count 10 1487975400 2017-02-25 1
top_level.max 9 1487970000 2017-02-25 1
top_level.max 19 1487970600 2017-02-25 1
top_level.max 29 1487971200 2017-02-25 1
top_level.max 39 1487971800 2017-02-25 1
top_level.max 49 1487972400 2017-02-25 1
top_level.max 59 1487973000 2017-02-25 1
top_level.max 69 1487973600 2017-02-25 1
top_level.max 79 1487974200 2017-02-25 1
top_level.max 89 1487974800 2017-02-25 1
top_level.max 99 1487975400 2017-02-25 1
'''
assert TSV(q('SELECT * FROM test.graphite'
' ORDER BY (metric, timestamp)')) == TSV(expected_merged)
def test_broken_partial_rollup(graphite_table):
q('''
DROP TABLE IF EXISTS test.graphite;
CREATE TABLE test.graphite
(metric String, value Float64, timestamp UInt32, date Date, updated UInt32)
ENGINE = GraphiteMergeTree('graphite_rollup_broken')
PARTITION BY toYYYYMM(date)
ORDER BY (metric, timestamp)
SETTINGS index_granularity=1;
''')
to_insert = '''\
one_min.x1 100 1000000000 2001-09-09 1
zzzzzzzz 100 1000000001 2001-09-09 1
zzzzzzzz 200 1000000001 2001-09-09 2
'''
q('INSERT INTO test.graphite FORMAT TSV', to_insert)
expected = '''\
one_min.x1 100 1000000000 2001-09-09 1
zzzzzzzz 200 1000000001 2001-09-09 2
'''
result = q('''
OPTIMIZE TABLE test.graphite PARTITION 200109 FINAL;
SELECT * FROM test.graphite;
''')
assert TSV(result) == TSV(expected)

View File

@ -0,0 +1,55 @@
<test>
<name>String sorting</name>
<preconditions>
<table_exists>hits_10m_single</table_exists>
</preconditions>
<type>loop</type>
<stop_conditions>
<all_of>
<iterations>5</iterations>
<min_time_not_changing_for_ms>10000</min_time_not_changing_for_ms>
</all_of>
<any_of>
<iterations>50</iterations>
<total_time_ms>60000</total_time_ms>
</any_of>
</stop_conditions>
<substitutions>
<substitution>
<name>str1</name>
<values>
<value>URL</value>
<value>Referer</value>
<value>Title</value>
<value>SearchPhrase</value>
<value>MobilePhoneModel</value>
<value>PageCharset</value>
</values>
</substitution>
<substitution>
<name>str2</name>
<values>
<value>URL</value>
<value>Referer</value>
<value>Title</value>
<value>SearchPhrase</value>
<value>MobilePhoneModel</value>
<value>PageCharset</value>
</values>
</substitution>
</substitutions>
<query><![CDATA[SELECT {str1} FROM hits_10m_single ORDER BY {str1} LIMIT 10]]></query>
<query><![CDATA[SELECT {str1} FROM hits_10m_single ORDER BY {str1} LIMIT 9000000, 10]]></query>
<query><![CDATA[SELECT {str1}, {str2} FROM hits_10m_single ORDER BY {str1}, {str2} LIMIT 10]]></query>
<query><![CDATA[SELECT {str1}, {str2} FROM hits_10m_single ORDER BY {str1}, {str2} LIMIT 9000000, 10]]></query>
<main_metric>
<min_time/>
</main_metric>
</test>

View File

@ -20,7 +20,7 @@ SELECT \n a, \n b\nFROM \n(\n SELECT \n toUInt64(sum(id) AS b) A
3 3
SELECT \n date, \n id, \n name, \n value\nFROM \n(\n SELECT \n date, \n name, \n value, \n min(id) AS id\n FROM test.test \n GROUP BY \n date, \n name, \n value\n HAVING id = 1\n) \nWHERE id = 1
2000-01-01 1 test string 1 1
SELECT \n a, \n b\nFROM \n(\n SELECT \n toUInt64(sum(id) AS b) AS a, \n b\n FROM test.test AS table_alias \n HAVING b = 3\n) AS outer_table_alias \nWHERE outer_table_alias.b = 3
SELECT \n a, \n b\nFROM \n(\n SELECT \n toUInt64(sum(id) AS b) AS a, \n b\n FROM test.test AS table_alias \n HAVING b = 3\n) AS outer_table_alias \nWHERE b = 3
3 3
SELECT \n date, \n id, \n name, \n value\nFROM \n(\n SELECT \n date, \n id, \n name, \n value\n FROM test.test \n WHERE id = 1\n) \nWHERE id = 1
2000-01-01 1 test string 1 1
@ -32,9 +32,9 @@ SELECT \n date, \n id, \n name, \n value\nFROM \n(\n SELECT \n
2000-01-01 1 test string 1 1
SELECT \n date, \n id, \n name, \n value\nFROM \n(\n SELECT \n date, \n id, \n name, \n value\n FROM \n (\n SELECT \n date, \n id, \n name, \n value\n FROM test.test \n WHERE id = 1\n ) \n WHERE id = 1\n) \nWHERE id = 1
2000-01-01 1 test string 1 1
SELECT \n date, \n id, \n name, \n value\nFROM \n(\n SELECT \n date, \n id, \n name, \n value\n FROM test.test \n WHERE id = 1\n) AS b \nWHERE b.id = 1
SELECT \n date, \n id, \n name, \n value\nFROM \n(\n SELECT \n date, \n id, \n name, \n value\n FROM test.test \n WHERE id = 1\n) AS b \nWHERE id = 1
2000-01-01 1 test string 1 1
SELECT \n date, \n id, \n name, \n value\nFROM \n(\n SELECT \n date, \n id, \n name, \n value\n FROM \n (\n SELECT \n date, \n id, \n name, \n value\n FROM test.test \n WHERE id = 1\n ) AS a \n WHERE id = 1\n) AS b \nWHERE b.id = 1
SELECT \n date, \n id, \n name, \n value\nFROM \n(\n SELECT \n date, \n id, \n name, \n value\n FROM \n (\n SELECT \n date, \n id, \n name, \n value\n FROM test.test \n WHERE id = 1\n ) AS a \n WHERE id = 1\n) AS b \nWHERE id = 1
2000-01-01 1 test string 1 1
SELECT \n id, \n date, \n value\nFROM \n(\n SELECT \n id, \n date, \n min(value) AS value\n FROM test.test \n WHERE id = 1\n GROUP BY \n id, \n date\n) \nWHERE id = 1
1 2000-01-01 1
@ -45,11 +45,11 @@ SELECT \n date, \n id, \n name, \n value, \n date, \n name, \n
2000-01-01 1 test string 1 1 2000-01-01 test string 1 1
SELECT \n id, \n date, \n name, \n value\nFROM \n(\n SELECT toInt8(1) AS id\n) \nANY LEFT JOIN test.test USING (id)\nWHERE value = 1
1 2000-01-01 test string 1 1
SELECT b.value\nFROM \n(\n SELECT toInt8(1) AS id\n) \nANY LEFT JOIN test.test AS b USING (id)\nWHERE value = 1
SELECT value\nFROM \n(\n SELECT toInt8(1) AS id\n) \nANY LEFT JOIN test.test AS b USING (id)\nWHERE value = 1
1
SELECT \n date, \n id, \n name, \n value\nFROM \n(\n SELECT \n date, \n id, \n name, \n value, \n date, \n name, \n value\n FROM \n (\n SELECT \n date, \n id, \n name, \n value\n FROM test.test \n WHERE id = 1\n ) \n ANY LEFT JOIN \n (\n SELECT *\n FROM test.test \n WHERE id = 1\n ) USING (id)\n WHERE id = 1\n) \nWHERE id = 1
2000-01-01 1 test string 1 1
SELECT \n date, \n id, \n name, \n value, \n `b.date`, \n `b.name`, \n `b.value`\nFROM \n(\n SELECT \n date, \n id, \n name, \n value\n FROM test.test \n) \nANY LEFT JOIN \n(\n SELECT *\n FROM test.test \n WHERE id = 1\n) AS b USING (id)\nWHERE b.id = 1
SELECT \n date, \n id, \n name, \n value, \n b.date, \n b.name, \n b.value\nFROM \n(\n SELECT \n date, \n id, \n name, \n value\n FROM test.test \n) \nANY LEFT JOIN \n(\n SELECT *\n FROM test.test \n WHERE id = 1\n) AS b USING (id)\nWHERE b.id = 1
2000-01-01 1 test string 1 1 2000-01-01 test string 1 1
SELECT \n id, \n date, \n name, \n value\nFROM \n(\n SELECT \n toInt8(1) AS id, \n toDate(\'2000-01-01\') AS date\n FROM system.numbers \n LIMIT 1\n) \nANY LEFT JOIN \n(\n SELECT *\n FROM test.test \n WHERE date = toDate(\'2000-01-01\')\n) AS b USING (date, id)\nWHERE b.date = toDate(\'2000-01-01\')
1 2000-01-01 test string 1 1

View File

@ -1,3 +1,5 @@
0 0
0 0
cross
1 1 1 1
1 1 1 2
@ -67,7 +69,7 @@ Explain ParsedAST (children 1)\n SelectWithUnionQuery (children 1)\n Expression
Explain ParsedAST (children 1)\n SelectWithUnionQuery (children 1)\n ExpressionList (children 1)\n SelectQuery (children 2)\n ExpressionList (children 1)\n Asterisk\n TablesInSelectQuery (children 2)\n TablesInSelectQueryElement (children 1)\n TableExpression (children 1)\n Identifier t1 (alias x)\n TablesInSelectQueryElement (children 2)\n TableJoin (children 1)\n Function and (children 1)\n ExpressionList (children 2)\n Function equals (children 1)\n ExpressionList (children 2)\n Identifier x.a\n Identifier y.a\n Function equals (children 1)\n ExpressionList (children 2)\n Identifier x.b\n Identifier y.b\n TableExpression (children 1)\n Identifier t1 (alias y)\n
cross one table expr
Explain ParsedAST (children 1)\n SelectWithUnionQuery (children 1)\n ExpressionList (children 1)\n SelectQuery (children 3)\n ExpressionList (children 1)\n Asterisk\n TablesInSelectQuery (children 2)\n TablesInSelectQueryElement (children 1)\n TableExpression (children 1)\n Identifier t1\n TablesInSelectQueryElement (children 2)\n TableExpression (children 1)\n Identifier t2\n TableJoin\n Function equals (children 1)\n ExpressionList (children 2)\n Identifier t1.a\n Identifier t1.b\n
Explain ParsedAST (children 1)\n SelectWithUnionQuery (children 1)\n ExpressionList (children 1)\n SelectQuery (children 3)\n ExpressionList (children 1)\n Asterisk\n TablesInSelectQuery (children 2)\n TablesInSelectQueryElement (children 1)\n TableExpression (children 1)\n Identifier t1\n TablesInSelectQueryElement (children 2)\n TableJoin\n TableExpression (children 1)\n Identifier t2\n Function equals (children 1)\n ExpressionList (children 2)\n Identifier t1.a\n Identifier t1.b\n
Explain ParsedAST (children 1)\n SelectWithUnionQuery (children 1)\n ExpressionList (children 1)\n SelectQuery (children 3)\n ExpressionList (children 1)\n Asterisk\n TablesInSelectQuery (children 2)\n TablesInSelectQueryElement (children 1)\n TableExpression (children 1)\n Identifier t1\n TablesInSelectQueryElement (children 2)\n TableExpression (children 1)\n Identifier t2\n TableJoin\n Function equals (children 1)\n ExpressionList (children 2)\n Identifier t1.a\n Identifier t1.b\n
cross multiple ands
Explain ParsedAST (children 1)\n SelectWithUnionQuery (children 1)\n ExpressionList (children 1)\n SelectQuery (children 3)\n ExpressionList (children 1)\n Asterisk\n TablesInSelectQuery (children 2)\n TablesInSelectQueryElement (children 1)\n TableExpression (children 1)\n Identifier t1\n TablesInSelectQueryElement (children 2)\n TableExpression (children 1)\n Identifier t2\n TableJoin\n Function and (children 1)\n ExpressionList (children 2)\n Function equals (children 1)\n ExpressionList (children 2)\n Identifier t1.a\n Identifier t2.a\n Function equals (children 1)\n ExpressionList (children 2)\n Identifier t1.b\n Identifier t2.b\n
Explain ParsedAST (children 1)\n SelectWithUnionQuery (children 1)\n ExpressionList (children 1)\n SelectQuery (children 2)\n ExpressionList (children 1)\n Asterisk\n TablesInSelectQuery (children 2)\n TablesInSelectQueryElement (children 1)\n TableExpression (children 1)\n Identifier t1\n TablesInSelectQueryElement (children 2)\n TableJoin (children 1)\n Function and (children 1)\n ExpressionList (children 2)\n Function equals (children 1)\n ExpressionList (children 2)\n Identifier t1.a\n Identifier t2.a\n Function equals (children 1)\n ExpressionList (children 2)\n Identifier t1.b\n Identifier t2.b\n TableExpression (children 1)\n Identifier t2\n

View File

@ -1,6 +1,11 @@
SET enable_debug_queries = 1;
USE test;
set allow_experimental_cross_to_join_conversion = 0;
select * from system.one cross join system.one;
set allow_experimental_cross_to_join_conversion = 1;
select * from system.one cross join system.one;
DROP TABLE IF EXISTS t1;
DROP TABLE IF EXISTS t2;

View File

@ -0,0 +1,17 @@
[1,2,3,4,5]
[3]
[1,2,3,4,5]
[1,2,4,5]
[1,2]
5
1
5
4
2
70
2019-01-01 50 [1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50]
2019-01-02 60 [11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70]
60 50 70 40 20 30
60 50 70 40 20 30
2019-01-01 50
2019-01-02 60

View File

@ -0,0 +1,77 @@
SELECT bitmapToArray(bitmapBuild([1, 2, 3, 4, 5]));
SELECT bitmapToArray(bitmapAnd(bitmapBuild([1,2,3]),bitmapBuild([3,4,5])));
SELECT bitmapToArray(bitmapOr(bitmapBuild([1,2,3]),bitmapBuild([3,4,5])));
SELECT bitmapToArray(bitmapXor(bitmapBuild([1,2,3]),bitmapBuild([3,4,5])));
SELECT bitmapToArray(bitmapAndnot(bitmapBuild([1,2,3]),bitmapBuild([3,4,5])));
SELECT bitmapCardinality(bitmapBuild([1, 2, 3, 4, 5]));
SELECT bitmapAndCardinality(bitmapBuild([1,2,3]),bitmapBuild([3,4,5]));
SELECT bitmapOrCardinality(bitmapBuild([1,2,3]),bitmapBuild([3,4,5]));
SELECT bitmapXorCardinality(bitmapBuild([1,2,3]),bitmapBuild([3,4,5]));
SELECT bitmapAndnotCardinality(bitmapBuild([1,2,3]),bitmapBuild([3,4,5]));
DROP TABLE IF EXISTS test.bitmap_test;
CREATE TABLE test.bitmap_test(pickup_date Date, city_id UInt32, uid UInt32)ENGINE = Memory;
INSERT INTO test.bitmap_test SELECT '2019-01-01', 1, number FROM numbers(1,50);
INSERT INTO test.bitmap_test SELECT '2019-01-02', 1, number FROM numbers(11,60);
SELECT groupBitmap( uid ) AS user_num FROM test.bitmap_test;
SELECT pickup_date, groupBitmap( uid ) AS user_num, bitmapToArray(groupBitmapState( uid )) AS users FROM test.bitmap_test GROUP BY pickup_date;
SELECT
bitmapCardinality(day_today) AS today_users,
bitmapCardinality(day_before) AS before_users,
bitmapOrCardinality(day_today, day_before) AS all_users,
bitmapAndCardinality(day_today, day_before) AS old_users,
bitmapAndnotCardinality(day_today, day_before) AS new_users,
bitmapXorCardinality(day_today, day_before) AS diff_users
FROM
(
SELECT city_id, groupBitmapState( uid ) AS day_today FROM test.bitmap_test WHERE pickup_date = '2019-01-02' GROUP BY city_id
)
ALL LEFT JOIN
(
SELECT city_id, groupBitmapState( uid ) AS day_before FROM test.bitmap_test WHERE pickup_date = '2019-01-01' GROUP BY city_id
)
USING city_id;
SELECT
bitmapCardinality(day_today) AS today_users,
bitmapCardinality(day_before) AS before_users,
bitmapCardinality(bitmapOr(day_today, day_before)) AS all_users,
bitmapCardinality(bitmapAnd(day_today, day_before)) AS old_users,
bitmapCardinality(bitmapAndnot(day_today, day_before)) AS new_users,
bitmapCardinality(bitmapXor(day_today, day_before)) AS diff_users
FROM
(
SELECT city_id, groupBitmapState( uid ) AS day_today FROM test.bitmap_test WHERE pickup_date = '2019-01-02' GROUP BY city_id
)
ALL LEFT JOIN
(
SELECT city_id, groupBitmapState( uid ) AS day_before FROM test.bitmap_test WHERE pickup_date = '2019-01-01' GROUP BY city_id
)
USING city_id;
DROP TABLE IF EXISTS test.bitmap_state_test;
CREATE TABLE test.bitmap_state_test
(
pickup_date Date,
city_id UInt32,
uv AggregateFunction( groupBitmap, UInt32 )
)
ENGINE = AggregatingMergeTree( pickup_date, ( pickup_date, city_id ), 8192);
INSERT INTO test.bitmap_state_test SELECT
pickup_date,
city_id,
groupBitmapState(uid) AS uv
FROM test.bitmap_test
GROUP BY pickup_date, city_id;
SELECT pickup_date, groupBitmapMerge(uv) AS users from test.bitmap_state_test group by pickup_date;
DROP TABLE IF EXISTS test.bitmap_test;
DROP TABLE IF EXISTS test.bitmap_state_test;

View File

@ -0,0 +1,45 @@
Row 1:
──────
t.a: 1
s.b: 1
s.a: 1
s.b: 1
y.a: 1
y.b: 1
Row 2:
──────
t.a: 2
s.b: 0
s.a: 0
s.b: 0
y.a: 0
y.b: 0
┌─t.a─┬─s.b─┬─s.a─┬─s.b─┬─y.a─┬─y.b─┐
│ 1 │ 1 │ 1 │ 1 │ 1 │ 1 │
│ 2 │ 0 │ 0 │ 0 │ 0 │ 0 │
└─────┴─────┴─────┴─────┴─────┴─────┘
┌─t_a─┐
│ 1 │
│ 2 │
└─────┘
┌─t.a─┬─s_a─┐
│ 1 │ 1 │
│ 2 │ 0 │
└─────┴─────┘
┌─t.a─┬─t.a─┬─t_b─┐
│ 1 │ 1 │ 1 │
│ 2 │ 2 │ 2 │
└─────┴─────┴─────┘
┌─s.a─┬─s.a─┬─s_b─┬─s_b─┐
│ 1 │ 1 │ 1 │ 1 │
│ 0 │ 0 │ 0 │ 0 │
└─────┴─────┴─────┴─────┘
┌─y.a─┬─y.a─┬─y_b─┬─y_b─┐
│ 1 │ 1 │ 1 │ 1 │
│ 0 │ 0 │ 0 │ 0 │
└─────┴─────┴─────┴─────┘
┌─t_a─┬─t_a─┬─s_a─┬─s_a─┬─y_a─┬─y_a─┐
│ 1 │ 1 │ 1 │ 1 │ 1 │ 1 │
│ 2 │ 2 │ 0 │ 0 │ 0 │ 0 │
└─────┴─────┴─────┴─────┴─────┴─────┘

View File

@ -0,0 +1,48 @@
use test;
drop table if exists t;
drop table if exists s;
drop table if exists y;
create table t(a Int64, b Int64) engine = TinyLog;
create table s(a Int64, b Int64) engine = TinyLog;
create table y(a Int64, b Int64) engine = TinyLog;
insert into t values (1,1), (2,2);
insert into s values (1,1);
insert into y values (1,1);
select t.a, s.b, s.a, s.b, y.a, y.b from t
left join s on (t.a = s.a and t.b = s.b)
left join y on (y.a = s.a and y.b = s.b) format Vertical;
select t.a, s.b, s.a, s.b, y.a, y.b from t
left join s on (t.a = s.a and s.b = t.b)
left join y on (y.a = s.a and y.b = s.b) format PrettyCompactNoEscapes;
select t.a as t_a from t
left join s on s.a = t_a format PrettyCompactNoEscapes;
select t.a, s.a as s_a from t
left join s on s.a = t.a
left join y on y.b = s.b format PrettyCompactNoEscapes;
select t.a, t.a, t.b as t_b from t
left join s on t.a = s.a
left join y on y.b = s.b format PrettyCompactNoEscapes;
select s.a, s.a, s.b as s_b, s.b from t
left join s on s.a = t.a
left join y on s.b = y.b format PrettyCompactNoEscapes;
select y.a, y.a, y.b as y_b, y.b from t
left join s on s.a = t.a
left join y on y.b = s.b format PrettyCompactNoEscapes;
select t.a, t.a as t_a, s.a, s.a as s_a, y.a, y.a as y_a from t
left join s on t.a = s.a
left join y on y.b = s.b format PrettyCompactNoEscapes;
drop table t;
drop table s;
drop table y;

View File

@ -0,0 +1,369 @@
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
1 0 0 1 1
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 1 0 1 0
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
1 0 0 1 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 0 1 0 1
0 1 0 1 0
0 0 1 0 1
0 1 0 1 0
0 0 1 0 1
0 1 0 1 0
0 0 1 0 1
0 1 0 1 0
0 0 1 0 1
1

View File

@ -0,0 +1,18 @@
WITH substring('aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa', 1, number) AS prefix, prefix || 'x' AS a, prefix || 'y' AS b SELECT a = b, a < b, a > b, a <= b, a >= b FROM numbers(40);
WITH substring('aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa', 1, number) AS prefix, prefix || 'y' AS a, prefix || 'x' AS b SELECT a = b, a < b, a > b, a <= b, a >= b FROM numbers(40);
WITH substring('aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa', 1, number) AS prefix, prefix || 'x' AS a, prefix || 'x' AS b SELECT a = b, a < b, a > b, a <= b, a >= b FROM numbers(40);
WITH substring('aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa', 1, number) AS prefix, prefix || 'x' || prefix AS a, prefix || 'y' || prefix AS b SELECT a = b, a < b, a > b, a <= b, a >= b FROM numbers(40);
WITH substring('aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa', 1, number) AS prefix, prefix || 'y' || prefix AS a, prefix || 'x' || prefix AS b SELECT a = b, a < b, a > b, a <= b, a >= b FROM numbers(40);
WITH substring('aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa', 1, number) AS prefix, prefix || 'x' || prefix AS a, prefix || 'x' || prefix AS b SELECT a = b, a < b, a > b, a <= b, a >= b FROM numbers(40);
WITH substring('aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa', 1, number) AS prefix, prefix || 'x' || prefix AS a, prefix || 'y' AS b SELECT a = b, a < b, a > b, a <= b, a >= b FROM numbers(40);
WITH substring('aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa', 1, number) AS prefix, prefix || 'y' || prefix AS a, prefix || 'x' AS b SELECT a = b, a < b, a > b, a <= b, a >= b FROM numbers(40);
WITH substring('aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa', 1, number) AS prefix, prefix || 'x' || prefix AS a, prefix || 'x' AS b SELECT a = b, a < b, a > b, a <= b, a >= b FROM numbers(40);
WITH arrayJoin(['aaa', 'bbb']) AS a, 'aaa\0bbb' AS b SELECT a = b, a < b, a > b, a <= b, a >= b;
WITH arrayJoin(['aaa', 'zzz']) AS a, 'aaa\0bbb' AS b SELECT a = b, a < b, a > b, a <= b, a >= b;
WITH arrayJoin(['aaa', 'bbb']) AS a, materialize('aaa\0bbb') AS b SELECT a = b, a < b, a > b, a <= b, a >= b;
WITH arrayJoin(['aaa', 'zzz']) AS a, materialize('aaa\0bbb') AS b SELECT a = b, a < b, a > b, a <= b, a >= b;
SELECT empty(toFixedString('', 1 + randConstant() % 100));

View File

@ -0,0 +1,4 @@
1
1500
0
Ok.

View File

@ -0,0 +1,13 @@
-- This test creates many threads to test the case when the ThreadPool removes some threads from the pool after a job is done.
SET max_block_size = 1, min_insert_block_size_rows = 0, min_insert_block_size_bytes = 0;
CREATE TEMPORARY TABLE t (x UInt64);
INSERT INTO t SELECT * FROM system.numbers LIMIT 1500;
SELECT DISTINCT blockSize() FROM t;
SET max_threads = 1500;
SELECT count() FROM t;
SELECT sum(sleep(0.1)) FROM t; -- All threads have time to be created.
SELECT 'Ok.';

View File

@ -75,6 +75,13 @@ Rollup configuration structure:
```
required-columns
pattern
regexp
function
pattern
regexp
age + precision
...
pattern
regexp
function
@ -88,15 +95,20 @@ default
...
```
When processing a row, ClickHouse checks the rules in the `pattern` section. If the metric name matches the `regexp`, the rules from the `pattern` section are applied; otherwise, the rules from the `default` section are used.
**Important:** The order of patterns must be the following:
The rules are defined with the `function` and `age + precision` fields.
1. Patterns *without* `function` *or* `retention`.
1. Patterns *with* both `function` *and* `retention`.
1. The `default` pattern.
When processing a row, ClickHouse checks the rules in the `pattern` sections. Each of `pattern` (including `default`) sections could contain `function` parameter for aggregation, `retention` parameters or both. If the metric name matches the `regexp`, the rules from the `pattern` section (or sections) are applied; otherwise, the rules from the `default` section are used.
Fields for `pattern` and `default` sections:
- `regexp` – A pattern for the metric name.
- `age` – The minimum age of the data in seconds.
- `precision` – How precisely to define the age of the data in seconds.
- `precision` – How precisely to define the age of the data in seconds. Should be a divisor of 86400 (the number of seconds in a day).
- `function` – The name of the aggregating function to apply to data whose age falls within the range `[age, age + precision]`.
The `required-columns`:

View File

@ -179,6 +179,48 @@ binary decimal
01101000 = 104
```
## groupBitmap
Bitmap or aggregate calculations from an unsigned integer column, returning a cardinality of type UInt64. If the `-State` suffix is added, it returns a [bitmap object](../functions/bitmap_functions.md) instead.
```
groupBitmap(expr)
```
**Parameters**
`expr` – An expression that results in the `UInt*` type.
**Return value**
Value of the `UInt64` type.
**Example**
Test data:
```
userid
1
1
2
3
```
Query:
```
SELECT groupBitmap(userid) as num FROM t
```
Result:
```
num
3
```
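The `-State` suffix can be combined with the [bitmap functions](../functions/bitmap_functions.md); as a minimal sketch on the same test table, the following returns the distinct values as an array rather than a cardinality (for the data above it yields `[1,2,3]`):
```
SELECT bitmapToArray(groupBitmapState(userid)) AS ids FROM t
```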
## min(x) {#agg_function-min}
Calculates the minimum.

View File

@ -0,0 +1,277 @@
# Bitmap functions
Bitmap functions operate on two bitmap objects and return either a new bitmap or a cardinality, using formula-based calculations such as and, or, xor, and not.
There are two ways to construct a bitmap object: with the aggregate function groupBitmap and the -State suffix, or from an Array object. A bitmap object can also be converted back to an Array object.
Bitmap objects are stored in a data structure that wraps RoaringBitmap: when the cardinality is less than or equal to 32, a Set object is used; when it is greater than 32, a RoaringBitmap object is used. This is why storing low-cardinality sets is faster.
For more information on RoaringBitmap, see: [CRoaring](https://github.com/RoaringBitmap/CRoaring).
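As a quick sketch of the round trip between the two representations (the functions used here are described in the sections below), the following query builds bitmaps from arrays, combines them, and converts the result back to an array:
``` sql
SELECT bitmapToArray(bitmapOr(bitmapBuild([1, 2, 3]), bitmapBuild([3, 4, 5]))) AS res
```
```
┌─res─────────┐
│ [1,2,3,4,5] │
└─────────────┘
```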
## bitmapBuild
Build a bitmap from an unsigned integer array.
```
bitmapBuild(array)
```
**Parameters**
- `array` unsigned integer array.
**Example**
``` sql
SELECT bitmapBuild([1, 2, 3, 4, 5]) AS res
```
## bitmapToArray
Convert a bitmap to an integer array.
```
bitmapToArray(bitmap)
```
**Parameters**
- `bitmap` bitmap object.
**Example**
``` sql
SELECT bitmapToArray(bitmapBuild([1, 2, 3, 4, 5])) AS res
```
```
┌─res─────────┐
│ [1,2,3,4,5] │
└─────────────┘
```
## bitmapAnd
Logical AND of two bitmaps; the result is a new bitmap.
```
bitmapAnd(bitmap,bitmap)
```
**Parameters**
- `bitmap` bitmap object.
**Example**
``` sql
SELECT bitmapToArray(bitmapAnd(bitmapBuild([1,2,3]),bitmapBuild([3,4,5]))) AS res
```
```
┌─res─┐
│ [3] │
└─────┘
```
## bitmapOr
Logical OR of two bitmaps; the result is a new bitmap.
```
bitmapOr(bitmap,bitmap)
```
**Parameters**
- `bitmap` bitmap object.
**Example**
``` sql
SELECT bitmapToArray(bitmapOr(bitmapBuild([1,2,3]),bitmapBuild([3,4,5]))) AS res
```
```
┌─res─────────┐
│ [1,2,3,4,5] │
└─────────────┘
```
## bitmapXor
Logical XOR (symmetric difference) of two bitmaps; the result is a new bitmap.
```
bitmapXor(bitmap,bitmap)
```
**Parameters**
- `bitmap` bitmap object.
**Example**
``` sql
SELECT bitmapToArray(bitmapXor(bitmapBuild([1,2,3]),bitmapBuild([3,4,5]))) AS res
```
```
┌─res───────┐
│ [1,2,4,5] │
└───────────┘
```
## bitmapAndnot
AND-NOT of two bitmaps (the elements of the first bitmap that are not in the second); the result is a new bitmap.
```
bitmapAndnot(bitmap,bitmap)
```
**Parameters**
- `bitmap` bitmap object.
**Example**
``` sql
SELECT bitmapToArray(bitmapAndnot(bitmapBuild([1,2,3]),bitmapBuild([3,4,5]))) AS res
```
```
┌─res───┐
│ [1,2] │
└───────┘
```
## bitmapCardinality
Return the bitmap cardinality as a value of type UInt64.
```
bitmapCardinality(bitmap)
```
**Parameters**
- `bitmap` bitmap object.
**Example**
``` sql
SELECT bitmapCardinality(bitmapBuild([1, 2, 3, 4, 5])) AS res
```
```
┌─res─┐
│ 5 │
└─────┘
```
## bitmapAndCardinality
Logical AND of two bitmaps, returning the cardinality as a value of type UInt64.
```
bitmapAndCardinality(bitmap,bitmap)
```
**Parameters**
- `bitmap` bitmap object.
**Example**
``` sql
SELECT bitmapAndCardinality(bitmapBuild([1,2,3]),bitmapBuild([3,4,5])) AS res;
```
```
┌─res─┐
│ 1 │
└─────┘
```
## bitmapOrCardinality
Logical OR of two bitmaps, returning the cardinality as a value of type UInt64.
```
bitmapOrCardinality(bitmap,bitmap)
```
**Parameters**
- `bitmap` bitmap object.
**Example**
``` sql
SELECT bitmapOrCardinality(bitmapBuild([1,2,3]),bitmapBuild([3,4,5])) AS res;
```
```
┌─res─┐
│ 5 │
└─────┘
```
## bitmapXorCardinality
Logical XOR of two bitmaps, returning the cardinality as a value of type UInt64.
```
bitmapXorCardinality(bitmap,bitmap)
```
**Parameters**
- `bitmap` bitmap object.
**Example**
``` sql
SELECT bitmapXorCardinality(bitmapBuild([1,2,3]),bitmapBuild([3,4,5])) AS res;
```
```
┌─res─┐
│ 4 │
└─────┘
```
## bitmapAndnotCardinality
AND-NOT of two bitmaps, returning the cardinality as a value of type UInt64.
```
bitmapAndnotCardinality(bitmap,bitmap)
```
**Parameters**
- `bitmap` bitmap object.
**Example**
``` sql
SELECT bitmapAndnotCardinality(bitmapBuild([1,2,3]),bitmapBuild([3,4,5])) AS res;
```
```
┌─res─┐
│ 2 │
└─────┘
```
[Original article](https://clickhouse.yandex/docs/en/query_language/functions/bitmap_functions/) <!--hide-->

View File

@ -46,14 +46,23 @@ The FINAL modifier can be used only for a SELECT from a CollapsingMergeTree tabl
### SAMPLE Clause {#select-sample-clause}
The SAMPLE clause allows for approximated query processing. Approximated query processing is only supported by the tables in the `MergeTree` family, and only if the sampling expression was specified during table creation (see the section [MergeTree engine](../operations/table_engines/mergetree.md)).
The `SAMPLE` clause allows for approximated query processing. Approximated query processing is only supported by the tables in the `MergeTree` family, and only if the sampling expression was specified during table creation (see [MergeTree engine](../operations/table_engines/mergetree.md)).
`SAMPLE` has the form `SAMPLE k`, where `k` is a decimal number from 0 to 1, or `SAMPLE n`, where `n` is a sufficiently large integer.
The features of data sampling are listed below:
In the first case, the query will be executed on 'k' percent of data. For example, `SAMPLE 0.1` runs the query on 10% of data.
In the second case, the query will be executed on a sample of no more than 'n' rows. For example, `SAMPLE 10000000` runs the query on a maximum of 10,000,000 rows.
- Data sampling is a deterministic mechanism. The result of the same `SELECT .. SAMPLE` query is always the same.
- Sampling works consistently for different tables. For tables with a single sampling key, a sample with the same coefficient always selects the same subset of possible data. For example, a sample of user IDs takes rows with the same subset of all the possible user IDs from different tables. This allows using the sample in subqueries in the `IN` clause, as well as for manually correlating results of different queries with samples.
- Sampling allows reading less data from a disk. Note that for this you must specify the sampling key correctly. For more details see [Creating a MergeTree Table](../operations/table_engines/mergetree.md#table_engine-mergetree-creating-a-table).
Example:
The `SAMPLE` clause can be specified in several ways:
- `SAMPLE k`, where `k` is a decimal number from 0 to 1. The query is executed on `k` percent of data. For example, `SAMPLE 0.1` runs the query on 10% of data. [Read more](#select-sample-k)
- `SAMPLE n`, where `n` is a sufficiently large integer. The query is executed on a sample of at least `n` rows (but not significantly more than this). For example, `SAMPLE 10000000` runs the query on a minimum of 10,000,000 rows. [Read more](#select-sample-n)
- `SAMPLE k OFFSET m` where `k` and `m` are numbers from 0 to 1. The query is executed on a sample of `k` percent of the data. The data used for the sample is offset by `m` percent. [Read more](#select-sample-offset)
#### SAMPLE k {#select-sample-k}
In a `SAMPLE k` clause, `k` is a percent amount of data that the sample is taken from. The example is shown below:
``` sql
SELECT
@ -63,26 +72,47 @@ FROM hits_distributed
SAMPLE 0.1
WHERE
CounterID = 34
AND toDate(EventDate) >= toDate('2013-01-29')
AND toDate(EventDate) <= toDate('2013-02-04')
AND NOT DontCountHits
AND NOT Refresh
AND Title != ''
GROUP BY Title
ORDER BY PageViews DESC LIMIT 1000
```
In this example, the query is executed on a sample from 0.1 (10%) of data. Values of aggregate functions are not corrected automatically, so to get an approximate result, the value `count()` is manually multiplied by 10.
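For instance, a minimal sketch of this manual correction, reusing the query above:
``` sql
SELECT count() * 10 AS approximate_count
FROM hits_distributed
SAMPLE 0.1
WHERE CounterID = 34
```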
When using something like `SAMPLE 10000000`, there isn't any information about which relative percent of data was processed or what the aggregate functions should be multiplied by, so this method of writing is not always appropriate to the situation.
#### SAMPLE n {#select-sample-n}
A sample with a relative coefficient is "consistent": if we look at all possible data that could be in the table, a sample (when using a single sampling expression specified during table creation) with the same coefficient always selects the same subset of possible data. In other words, a sample from different tables on different servers at different times is made the same way.
In this case, the query is executed on a sample of at least `n` rows, where `n` is a sufficiently large integer. For example, `SAMPLE 10000000`.
For example, a sample of user IDs takes rows with the same subset of all the possible user IDs from different tables. This allows using the sample in subqueries in the IN clause, as well as for manually correlating results of different queries with samples.
Since the minimum unit for data reading is one granule (its size is set by the `index_granularity` setting), it makes sense to set a sample that is much larger than the size of the granule.
**SAMPLE OFFSET**
When using the `SAMPLE n` clause, the relative coefficient is calculated dynamically. Since you do not know which relative percent of data was processed, you do not know the coefficient the aggregate functions should be multiplied by (for example, you do not know if the `SAMPLE 1000000` was taken from a set of 10,000,000 rows or from a set of 1,000,000,000 rows). In this case, use the `_sample_factor` column to get the approximate result.
You can specify the `SAMPLE k OFFSET n` clause, where `k` and `n` are numbers from 0 to 1. Examples are shown below.
`_sample_factor` is a virtual column in which ClickHouse stores relative coefficients. This column is created automatically when you create a table with the specified sampling key. A usage example is shown below:
``` sql
SELECT sum(Duration * _sample_factor)
FROM visits
SAMPLE 10000000
```
If you need to get the approximate count of rows in a `SELECT .. SAMPLE n` query, take the `sum()` of the `_sample_factor` column instead of counting the `count(column * _sample_factor)` value. For example:
``` sql
SELECT sum(_sample_factor)
FROM visits
SAMPLE 10000000
```
Note that to calculate the average in a `SELECT .. SAMPLE n` query, you do not need to use the `_sample_factor` column:
``` sql
SELECT avg(Duration)
FROM visits
SAMPLE 10000000
```
#### SAMPLE k OFFSET m {#select-sample-offset}
You can specify the `SAMPLE k OFFSET m` clause, where `k` and `m` are numbers from 0 to 1. Examples are shown below.
Example 1.
@ -718,10 +748,10 @@ DISTINCT is not supported if SELECT has at least one array column.
### LIMIT Clause
LIMIT m allows you to select the first 'm' rows from the result.
LIMIT n, m allows you to select the first 'm' rows from the result after skipping the first 'n' rows.
`LIMIT m` allows you to select the first `m` rows from the result.
`LIMIT n, m` allows you to select the first `m` rows from the result after skipping the first `n` rows.
'n' and 'm' must be non-negative integers.
`n` and `m` must be non-negative integers.
If there isn't an ORDER BY clause that explicitly sorts results, the result may be arbitrary and nondeterministic.
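A minimal sketch (the table and column names are hypothetical):
``` sql
SELECT PageViews
FROM hits
ORDER BY PageViews DESC
LIMIT 10, 5 -- skip the first 10 rows, then return the next 5
```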

View File

@ -86,6 +86,7 @@ functions/arithmetic_functions.md query_language/functions/arithmetic_functions.
functions/array_functions.md query_language/functions/array_functions.md
functions/array_join.md query_language/functions/array_join.md
functions/bit_functions.md query_language/functions/bit_functions.md
functions/bitmap_functions.md query_language/functions/bitmap_functions.md
functions/comparison_functions.md query_language/functions/comparison_functions.md
functions/conditional_functions.md query_language/functions/conditional_functions.md
functions/date_time_functions.md query_language/functions/date_time_functions.md

View File

@ -72,12 +72,19 @@ CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster]
## Rollup configuration
The settings for data rollup are defined by the [graphite_rollup](../server_settings/settings.md#server_settings-graphite_rollup) parameter. The parameter name can be anything. You can create several configurations and use them for different tables.
Rollup configuration structure:
```
required-columns
pattern
regexp
function
pattern
regexp
age + precision
...
pattern
regexp
function
@ -91,15 +98,19 @@ default
...
```
When processing a row, ClickHouse checks the rules in the `pattern` section. If the metric name matches the `regexp`, the rules from the `pattern` section are applied; otherwise, the rules from the `default` section are used.
**Important:** The order of the `pattern` sections must be the following:
The rules are defined with the `function` and `age + precision` fields.
1. Sections *without* the `function` *or* `retention` parameter.
1. Sections *with* both the `function` *and* `retention` parameters.
1. The `default` section.
When processing a row, ClickHouse checks the rules in the `pattern` sections. Each of the `pattern` sections (including `default`) can contain a `function` parameter for aggregation, `retention` parameters for thinning, or both. If the metric name matches the `regexp`, the rules from the `pattern` section (or sections) are applied; otherwise, the rules from the `default` section are used.
Fields for the `pattern` and `default` sections:
- `regexp` – A pattern for the metric name.
- `age` – The minimum age of the data in seconds.
- `precision` – How precisely to define the age of the data in seconds.
- `precision` – How precisely to define the age of the data in seconds. Must be a divisor of 86400 (the number of seconds in a day).
- `function` – The name of the aggregating function to apply to data whose age falls within the range `[age, age + precision]`.
`required-columns`:
@ -117,6 +128,10 @@ default
<time_column_name>Time</time_column_name>
<value_column_name>Value</value_column_name>
<version_column_name>Version</version_column_name>
<pattern>
<regexp>\.count$</regexp>
<function>sum</function>
</pattern>
<pattern>
<regexp>click_cost</regexp>
<function>any</function>

View File

@ -712,8 +712,6 @@ WHERE and HAVING differ in that WHERE is executed
`DISTINCT` works with [NULL](syntax.md) as if `NULL` were a specific value, where `NULL=NULL`. That is, in the `DISTINCT` result, different combinations that include `NULL` occur only once.
### LIMIT Clause
LIMIT m allows you to select the first m rows from the result.

View File

@ -115,6 +115,7 @@ nav:
- 'Working with Arrays': 'query_language/functions/array_functions.md'
- 'Splitting and Merging Strings and Arrays': 'query_language/functions/splitting_merging_functions.md'
- 'Bit': 'query_language/functions/bit_functions.md'
- 'Bitmap functions': 'query_language/functions/bitmap_functions.md'
- 'Hash': 'query_language/functions/hash_functions.md'
- 'Generating Pseudo-Random Numbers': 'query_language/functions/random_functions.md'
- 'Encoding': 'query_language/functions/encoding_functions.md'

View File

@ -1,148 +0,0 @@
# GraphiteMergeTree
This engine is designed for rollup (thinning and aggregating/averaging) [Graphite](http://graphite.readthedocs.io/en/latest/index.html) data. It may be helpful to developers who want to use ClickHouse as a data store for Graphite.
You can use any ClickHouse table engine to store the Graphite data if you don't need rollup, but if you do need rollup, use `GraphiteMergeTree`. The engine reduces the volume of storage and increases the efficiency of queries from Graphite.
The engine inherits properties from [MergeTree](mergetree.md).
## Creating a Table
```sql
CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster]
(
Path String,
Time DateTime,
Value <Numeric_type>,
Version <Numeric_type>
...
) ENGINE = GraphiteMergeTree(config_section)
[PARTITION BY expr]
[ORDER BY expr]
[SAMPLE BY expr]
[SETTINGS name=value, ...]
```
For a description of request parameters, see [request description](../../query_language/create.md).
A table for the Graphite data should have the following columns:
- Column with the metric name (Graphite sensor). Data type: `String`.
- Column with the time for measuring the metric. Data type: `DateTime`.
- Column with the value of the metric. Data type: any numeric.
- Column with the version of the metric with the same name and time of measurement. Data type: any numeric.
ClickHouse saves the rows with the highest version or the last written if versions are the same. Other rows are deleted during the merge of data parts.
The names of these columns should be set in the rollup configuration.
**GraphiteMergeTree parameters**
- `config_section` — Name of the section in the configuration file where the rollup rules are set.
**Query clauses**
When creating a `GraphiteMergeTree` table, the same [clauses](mergetree.md) are required, as when creating a `MergeTree` table.
<details markdown="1"><summary>Deprecated Method for Creating a Table</summary>
!!! attention
Do not use this method in new projects and, if possible, switch the old projects to the method described above.
```sql
CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster]
(
EventDate Date,
Path String,
Time DateTime,
Value <Numeric_type>,
Version <Numeric_type>
...
) ENGINE [=] GraphiteMergeTree(date-column [, sampling_expression], (primary, key), index_granularity, config_section)
```
All of the parameters except `config_section` have the same meaning as in `MergeTree`.
- `config_section` — Name of the section in the configuration file where the rollup rules are set.
</details>
## Rollup configuration
The settings for rollup are defined by the [graphite_rollup](../server_settings/settings.md) parameter in the server configuration. The parameter name can be anything. You can create several configurations and use them for different tables.
Rollup configuration structure:
```
required-columns
pattern
regexp
function
age + precision
...
pattern
...
default
function
age + precision
...
```
When processing a row, ClickHouse checks the rules in the `pattern` section. If the metric name matches the `regexp`, the rules from the `pattern` section are applied; otherwise, the rules from the `default` section are used.
The rules are defined with the `function` and `age + precision` fields.
Fields for `pattern` and `default` sections:
- `regexp` A pattern for the metric name.
- `age` The minimum age of the data in seconds.
- `precision` How precisely to define the age of the data in seconds.
- `function` The name of the aggregating function to apply to data whose age falls within the range `[age, age + precision]`.
The `required-columns`:
- `path_column_name` — Column with the metric name (Graphite sensor).
- `time_column_name` — Column with the time for measuring the metric.
- `value_column_name` — Column with the value of the metric at the time set in `time_column_name`.
- `version_column_name` — Column with the version of the metric; for rows with the same name and time, the one with the highest version remains in the database.
Example of settings:
```xml
<graphite_rollup>
<path_column_name>Path</path_column_name>
<time_column_name>Time</time_column_name>
<value_column_name>Value</value_column_name>
<version_column_name>Version</version_column_name>
<pattern>
<regexp>click_cost</regexp>
<function>any</function>
<retention>
<age>0</age>
<precision>5</precision>
</retention>
<retention>
<age>86400</age>
<precision>60</precision>
</retention>
</pattern>
<default>
<function>max</function>
<retention>
<age>0</age>
<precision>60</precision>
</retention>
<retention>
<age>3600</age>
<precision>300</precision>
</retention>
<retention>
<age>86400</age>
<precision>3600</precision>
</retention>
</default>
</graphite_rollup>
```
[Original article](https://clickhouse.yandex/docs/en/operations/table_engines/graphitemergetree/) <!--hide-->

View File

@ -0,0 +1 @@
../../../en/operations/table_engines/graphitemergetree.md

View File

@ -1,235 +0,0 @@
# MergeTree {#table_engines-mergetree}
The `MergeTree` engine and other engines of this family (`*MergeTree`) are the most robust ClickHouse table engines.
The basic idea behind the `MergeTree` family of engines is the following: when you have a tremendous amount of data to insert into a table, you write it quickly, part by part, and then merge the parts by certain rules in the background. This method is much more efficient than continually rewriting the data in storage on insert.
Main features:
- Stores data sorted by primary key.
This allows you to create a small sparse index that helps find data faster.
- This allows you to use partitions if the [partitioning key](custom_partitioning_key.md) is specified.
ClickHouse supports certain operations with partitions that are more effective than general operations on the same data with the same result. ClickHouse also automatically cuts off the partition data where the partitioning key is specified in the query. This also increases the query performance.
- Data replication support.
The family of `ReplicatedMergeTree` tables is used for this. For more information, see the [Data replication](replication.md) section.
- Data sampling support.
If necessary, you can set the data sampling method in the table.
!!! info
The [Merge](merge.md) engine does not belong to the `*MergeTree` family.
## Creating a Table
```
CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster]
(
name1 [type1] [DEFAULT|MATERIALIZED|ALIAS expr1],
name2 [type2] [DEFAULT|MATERIALIZED|ALIAS expr2],
...
) ENGINE = MergeTree()
[PARTITION BY expr]
[ORDER BY expr]
[PRIMARY KEY expr]
[SAMPLE BY expr]
[SETTINGS name=value, ...]
```
For a description of request parameters, see [request description](../../query_language/create.md).
**Query clauses**
- `ENGINE` - Name and parameters of the engine. `ENGINE = MergeTree()`. `MergeTree` engine does not have parameters.
- `PARTITION BY` — The [partitioning key](custom_partitioning_key.md).
For partitioning by month, use the `toYYYYMM(date_column)` expression, where `date_column` is a column with a date of the type [Date](../../data_types/date.md). The partition names here have the `"YYYYMM"` format.
- `ORDER BY` — The sorting key.
A tuple of columns or arbitrary expressions. Example: `ORDER BY (CounterID, EventDate)`.
- `PRIMARY KEY` - The primary key if it [differs from the sorting key](mergetree.md).
By default the primary key is the same as the sorting key (which is specified by the `ORDER BY` clause).
Thus in most cases it is unnecessary to specify a separate `PRIMARY KEY` clause.
- `SAMPLE BY` — An expression for sampling.
If a sampling expression is used, the primary key must contain it. Example:
`SAMPLE BY intHash32(UserID) ORDER BY (CounterID, EventDate, intHash32(UserID))`.
- `SETTINGS` — Additional parameters that control the behavior of the `MergeTree`:
- `index_granularity` — The granularity of an index. The number of data rows between the "marks" of an index. By default, 8192.
**Example of sections setting**
```
ENGINE MergeTree() PARTITION BY toYYYYMM(EventDate) ORDER BY (CounterID, EventDate, intHash32(UserID)) SAMPLE BY intHash32(UserID) SETTINGS index_granularity=8192
```
In the example, we set partitioning by month.
We also set an expression for sampling as a hash by the user ID. This allows you to pseudorandomize the data in the table for each `CounterID` and `EventDate`. If, when selecting the data, you define a [SAMPLE](../../query_language/select.md#select-sample-clause) clause, ClickHouse will return an evenly pseudorandom data sample for a subset of users.
`index_granularity` could be omitted because 8192 is the default value.
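For instance, a hedged sketch of a sampled query against such a table (the filter value is arbitrary; `SAMPLE 0.1` reads roughly 10% of the users):
``` sql
SELECT count() FROM table SAMPLE 0.1 WHERE CounterID = 34
```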
<details markdown="1"><summary>Deprecated Method for Creating a Table</summary>
!!! attention
Do not use this method in new projects and, if possible, switch the old projects to the method described above.
```
CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster]
(
name1 [type1] [DEFAULT|MATERIALIZED|ALIAS expr1],
name2 [type2] [DEFAULT|MATERIALIZED|ALIAS expr2],
...
) ENGINE [=] MergeTree(date-column [, sampling_expression], (primary, key), index_granularity)
```
**MergeTree() parameters**
- `date-column` — The name of a column of the type [Date](../../data_types/date.md). ClickHouse automatically creates partitions by month on the basis of this column. The partition names are in the `"YYYYMM"` format.
- `sampling_expression` — an expression for sampling.
- `(primary, key)` — Primary key. Type: [Tuple()](../../data_types/tuple.md).
- `index_granularity` — The granularity of an index. The number of data rows between the "marks" of an index. The value 8192 is appropriate for most tasks.
**Example**
```
MergeTree(EventDate, intHash32(UserID), (CounterID, EventDate, intHash32(UserID)), 8192)
```
The `MergeTree` engine is configured in the same way as in the example above for the main engine configuration method.
</details>
## Data Storage
A table consists of data *parts* sorted by primary key.
When data is inserted in a table, separate data parts are created and each of them is lexicographically sorted by primary key. For example, if the primary key is `(CounterID, Date)`, the data in the part is sorted by `CounterID`, and within each `CounterID`, it is ordered by `Date`.
Data belonging to different partitions are separated into different parts. In the background, ClickHouse merges data parts for more efficient storage. Parts belonging to different partitions are not merged. The merge mechanism does not guarantee that all rows with the same primary key will be in the same data part.
For each data part, ClickHouse creates an index file that contains the primary key value for each index row ("mark"). Index row numbers are defined as `n * index_granularity`. The maximum value `n` is equal to the integer part of dividing the total number of rows by the `index_granularity`. For each column, the "marks" are also written for the same index rows as the primary key. These "marks" allow you to find the data directly in the columns.
You can use a single large table and continually add data to it in small chunks; this is what the `MergeTree` engine is intended for.
## Primary Keys and Indexes in Queries
Let's take the `(CounterID, Date)` primary key. In this case, the sorting and index can be illustrated as follows:
```
Whole data: [-------------------------------------------------------------------------]
CounterID: [aaaaaaaaaaaaaaaaaabbbbcdeeeeeeeeeeeeefgggggggghhhhhhhhhiiiiiiiiikllllllll]
Date: [1111111222222233331233211111222222333211111112122222223111112223311122333]
Marks: | | | | | | | | | | |
a,1 a,2 a,3 b,3 e,2 e,3 g,1 h,2 i,1 i,3 l,3
Marks numbers: 0 1 2 3 4 5 6 7 8 9 10
```
If the data query specifies:
- `CounterID in ('a', 'h')`, the server reads the data in the ranges of marks `[0, 3)` and `[6, 8)`.
- `CounterID IN ('a', 'h') AND Date = 3`, the server reads the data in the ranges of marks `[1, 3)` and `[7, 8)`.
- `Date = 3`, the server reads the data in the range of marks `[1, 10]`.
The examples above show that it is always more effective to use an index than a full scan.
A sparse index allows extra rows to be read. When reading a single range of the primary key, up to `index_granularity * 2` extra rows in each data block can be read. In most cases, ClickHouse performance does not degrade when `index_granularity = 8192`.
Sparse indexes allow you to work with a very large number of table rows, because such indexes are always stored in the computer's RAM.
ClickHouse does not require a unique primary key. You can insert multiple rows with the same primary key.
### Selecting the Primary Key
The number of columns in the primary key is not explicitly limited. Depending on the data structure, you can include more or fewer columns in the primary key. This may:
- Improve the performance of an index.
If the primary key is `(a, b)`, then adding another column `c` will improve the performance if the following conditions are met:
- There are queries with a condition on column `c`.
- Long data ranges (several times longer than the `index_granularity`) with identical values for `(a, b)` are common. In other words, adding another column allows you to skip quite long data ranges.
- Improve data compression.
ClickHouse sorts data by primary key, so the higher the consistency, the better the compression.
- Provide additional logic when merging data parts in the [CollapsingMergeTree](collapsingmergetree.md#table_engine-collapsingmergetree) and [SummingMergeTree](summingmergetree.md) engines.
In this case it makes sense to specify the *sorting key* that is different from the primary key.
A long primary key will negatively affect the insert performance and memory consumption, but extra columns in the primary key do not affect ClickHouse performance during `SELECT` queries.
### Choosing the Primary Key that differs from the Sorting Key
It is possible to specify the primary key (the expression, values of which are written into the index file
for each mark) that is different from the sorting key (the expression for sorting the rows in data parts).
In this case the primary key expression tuple must be a prefix of the sorting key expression tuple.
This feature is helpful when using the [SummingMergeTree](summingmergetree.md) and
[AggregatingMergeTree](aggregatingmergetree.md) table engines. In a common case when using these engines the
table has two types of columns: *dimensions* and *measures*. Typical queries aggregate values of measure
columns with arbitrary `GROUP BY` and filtering by dimensions. As SummingMergeTree and AggregatingMergeTree
aggregate rows with the same value of the sorting key, it is natural to add all dimensions to it. As a result
the key expression consists of a long list of columns and this list must be frequently updated with newly
added dimensions.
In this case it makes sense to leave only a few columns in the primary key that will provide efficient
range scans and add the remaining dimension columns to the sorting key tuple.
[ALTER of the sorting key](../../query_language/alter.md) is a
lightweight operation because when a new column is simultaneously added to the table and to the sorting key
data parts need not be changed (they remain sorted by the new sorting key expression).
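A minimal sketch of this layout (the table and dimension names are hypothetical): the primary key is a prefix of the sorting key, so range scans stay efficient while new dimensions can later be appended to the sorting key:
```
CREATE TABLE agg_metrics
(
    CounterID UInt32,
    EventDate Date,
    Dim1 String,
    Dim2 String,
    Views UInt64
) ENGINE = SummingMergeTree()
PARTITION BY toYYYYMM(EventDate)
ORDER BY (CounterID, EventDate, Dim1, Dim2)
PRIMARY KEY (CounterID, EventDate)
```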
### Use of Indexes and Partitions in Queries
For `SELECT` queries, ClickHouse analyzes whether an index can be used. An index can be used if the `WHERE/PREWHERE` clause has an expression (as one of the conjunction elements, or entirely) that represents an equality or inequality comparison operation, or if it has `IN` or `LIKE` with a fixed prefix on columns or expressions that are in the primary key or partitioning key, or on certain partially repetitive functions of these columns, or logical relationships of these expressions.
Thus, it is possible to quickly run queries on one or many ranges of the primary key. In this example, queries will be fast when run for a specific tracking tag; for a specific tag and date range; for a specific tag and date; for multiple tags with a date range, and so on.
Let's look at the engine configured as follows:
```
ENGINE MergeTree() PARTITION BY toYYYYMM(EventDate) ORDER BY (CounterID, EventDate) SETTINGS index_granularity=8192
```
In this case, in queries:
``` sql
SELECT count() FROM table WHERE EventDate = toDate(now()) AND CounterID = 34
SELECT count() FROM table WHERE EventDate = toDate(now()) AND (CounterID = 34 OR CounterID = 42)
SELECT count() FROM table WHERE ((EventDate >= toDate('2014-01-01') AND EventDate <= toDate('2014-01-31')) OR EventDate = toDate('2014-05-01')) AND CounterID IN (101500, 731962, 160656) AND (CounterID = 101500 OR EventDate != toDate('2014-05-01'))
```
ClickHouse will use the primary key index to trim improper data and the monthly partitioning key to trim partitions that are in improper date ranges.
The queries above show that the index is used even for complex expressions. Reading from the table is organized so that using the index can't be slower than a full scan.
In the example below, the index can't be used.
``` sql
SELECT count() FROM table WHERE CounterID = 34 OR URL LIKE '%upyachka%'
```
To check whether ClickHouse can use the index when running a query, use the settings [force_index_by_date](../settings/settings.md#settings-force_index_by_date) and [force_primary_key](../settings/settings.md).
The key for partitioning by month allows reading only those data blocks which contain dates from the proper range. In this case, the data block may contain data for many dates (up to an entire month). Within a block, data is sorted by primary key, which might not contain the date as the first column. Because of this, using a query with only a date condition that does not specify the primary key prefix will cause more data to be read than for a single date.
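For example, a hedged sketch of such a date-only query; it reads every `CounterID` range inside the matching monthly partition:
``` sql
SELECT count() FROM table WHERE EventDate = toDate('2014-01-01')
```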
## Concurrent Data Access
For concurrent table access, we use multi-versioning. In other words, when a table is simultaneously read and updated, data is read from a set of parts that is current at the time of the query. There are no lengthy locks. Inserts do not get in the way of read operations.
Reading from a table is automatically parallelized.
[Original article](https://clickhouse.yandex/docs/en/operations/table_engines/mergetree/) <!--hide-->

View File

@ -0,0 +1 @@
../../../en/operations/table_engines/mergetree.md

View File

@ -1,11 +1,5 @@
find_package (Threads)
add_executable (util-clickhouse-compressor main.cpp)
target_link_libraries (util-clickhouse-compressor PRIVATE clickhouse-compressor-lib)
set_target_properties(util-clickhouse-compressor PROPERTIES OUTPUT_NAME "clickhouse-compressor")
#install (TARGETS util-clickhouse-compressor RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR} COMPONENT clickhouse-compressor)
add_executable (zstd_test zstd_test.cpp)
target_link_libraries (zstd_test PRIVATE ${ZSTD_LIBRARY} common Threads::Threads)